From 21152087d82a9db4523fcb52143c62e68d1e61c5 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 29 May 2026 03:32:12 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: kakaocorp/kanana-1.5-15.7b-a3b-instruct Source: Original Platform --- .gitattributes | 49 + LICENSE | 73 + README.md | 238 + assets/logo/kanana-logo.png | Bin 0 -> 59023 bytes config.json | 36 + configuration.json | 1 + generation_config.json | 10 + ...tionary_kanana_tool_parser.cpython-310.pyc | Bin 0 -> 8112 bytes ...tionary_kanana_tool_parser.cpython-312.pyc | Bin 0 -> 13786 bytes .../functionary_kanana_tool_parser.py | 401 ++ kanana_tool_calls/lmalign_v1.jinja | 320 + model-00001-of-00007.safetensors | 3 + model-00002-of-00007.safetensors | 3 + model-00003-of-00007.safetensors | 3 + model-00004-of-00007.safetensors | 3 + model-00005-of-00007.safetensors | 3 + model-00006-of-00007.safetensors | 3 + model-00007-of-00007.safetensors | 3 + model.safetensors.index.json | 6378 +++++++++++++++++ special_tokens_map.json | 23 + tokenizer.json | 3 + tokenizer_config.json | 2092 ++++++ 22 files changed, 9645 insertions(+) create mode 100644 .gitattributes create mode 100644 LICENSE create mode 100644 README.md create mode 100644 assets/logo/kanana-logo.png create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 kanana_tool_calls/__pycache__/functionary_kanana_tool_parser.cpython-310.pyc create mode 100644 kanana_tool_calls/__pycache__/functionary_kanana_tool_parser.cpython-312.pyc create mode 100644 kanana_tool_calls/functionary_kanana_tool_parser.py create mode 100644 kanana_tool_calls/lmalign_v1.jinja create mode 100644 model-00001-of-00007.safetensors create mode 100644 
model-00002-of-00007.safetensors create mode 100644 model-00003-of-00007.safetensors create mode 100644 model-00004-of-00007.safetensors create mode 100644 model-00005-of-00007.safetensors create mode 100644 model-00006-of-00007.safetensors create mode 100644 model-00007-of-00007.safetensors create mode 100644 model.safetensors.index.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..21b3632 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,49 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bin.* filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text 
+**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +tokenizer.json filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..1d6566a --- /dev/null +++ b/LICENSE @@ -0,0 +1,73 @@ +KANANA LICENSE AGREEMENT + +Kanana Release Date: July 17, 2025 + +This KANANA LICENSE AGREEMENT (this “Agreement”) is made by and between you and Kakao Corp. (“KAKAO”) that governs your use of Kanana Materials that KAKAO provides to you. +By using, copying, modifying, distributing, performing, or displaying all or part of Kanana Materials, or otherwise accepting the terms and conditions of this Agreement, you agree to be bound by this Agreement. You hereby represent and warrant that (i) you are legally authorized to enter into this Agreement, and (ii) if you are entering into this Agreement on behalf of a legal entity, you have the authority to legally and validly bind such entity. + +1. Definition + 1.1 “Agreement” means the terms and conditions for use, copying, distribution and modification of Kanana Materials as set forth herein. + 1.2 “KAKAO” means Kakao Corp. + 1.3 “You” means an individual or legal entity that enters into this Agreement with KAKAO and exercises its rights hereunder or uses Kanana Materials for any purpose. 
If you enter into this Agreement on behalf of a legal entity, “you” shall include such entity. + 1.4 “Kanana” means the basic large-scale language model, software, and algorithms distributed by KAKAO under this Agreement, including parameters (such as Model Weights and optimizer status), machine learning model codes, inference/learning/fine-tuning codes, and other related elements. + 1.5 “Documentation” means the specifications, manuals, and other documentation accompanying Kanana distributed by KAKAO. + 1.6 “Kanana Materials” means, collectively, Kanana and Documentation, including any portions or components thereof. + 1.7 “Outputs” means information content generated by operating or otherwise using Kanana Materials. + 1.8 “Derivative Works” means (i) any modifications to Kanana, (ii) any work of authorship based on Kanana, or (iii) any other designed machine learning models that either directly use the patterns of Model Weights, parameters, operations, and/or outputs or incorporate a substantial part of Kanana’s performance or functional characteristics through methods including, but not limited to, transfer learning, fine-tuning, or knowledge distillation. This includes distillation methods using Kanana’s intermediate data representations or a method based on the synthetic data outputs generated by Kanana; provided, however, that Outputs shall not be deemed to be Derivative Works. + 1.9 “Model Weights” means a set of numerical parameter values generated during Kanana’s learning process, representing the result of substantial investment and effort by KAKAO. + +2. Grant of License and Use Policy + 2.1 Grant of License. 
Subject to the terms and conditions of this Agreement, you are granted a non-exclusive, worldwide, non-transferrable, royalty-free limited license under KAKAO’s intellectual property or other rights owned by KAKAO that enables you to access, download, install, copy, use, reproduce, distribute, create Derivative Works of, and make modifications to Kanana Materials. + 2.2 Policy on Prohibited Use. Your use of Kanana Materials and Derivative Works must comply with applicable laws and regulations and adhere to KAKAO’s Guidelines For Responsible AI (https://www.kakaocorp.com/page/responsible/detail/guidelinesForResponsibleAI), which is hereby incorporated into this Agreement. + 2.3 This Agreement applies solely to Kanana-*** and shall not apply to any other models distributed by KAKAO under separate licenses. Licenses applicable to such other models shall not apply to Kanana-***. + 2.4 The license terms applicable to a specific version of Kanana applies exclusively to that version and shall not extend to any other versions. Each version shall be deemed as an independent and separate work of authorship. + 2.5 You may use each version of Kanana only in accordance with the license terms expressly specified for that version, and you shall not claim that the license terms applicable to one version apply to any other version. + 2.6 You shall not combine different versions of Kanana versions that are subject to different license terms in order to circumvent any applicable license terms. + +3. 
Redistribution + 3.1 You may copy, distribute or disclose Kanana, Derivative Works, or any products or services that contain Kanana or Derivative Works; provided, however, that you shall: + (i) incorporate the compliance obligation set forth in the Policy on Prohibited Use provision of Section 2.2 in any agreement for use and distribution and notify subsequent users that such use restrictions apply; + (ii) provide any recipients of Kanana Materials or Derivative Works a copy of this Agreement; + (iii) expressly indicate in any files you have modified that it has been modified by you; + (iv) include a “Notice” text file that includes the following notice: + “Kanana is licensed in accordance with the Kanana License Agreement. Copyright © KAKAO Corp. All Rights Reserved.”; and + (v) clearly display the phrase “Powered by Kanana” on related websites, user interfaces, blog posts, introduction pages, or product documentation in a manner that is easily recognizable to users. In addition, if you use Kanana Materials or their outputs to create, train, improve, or enhance other AI models and distribute them, you must include ‘Kanana’ as a prefix to the name of such AI models. + 3.2 You may add your own copyright statement to your modifications of Kanana Materials and may provide additional or different license terms and conditions; provided, however, that such additional or different license terms and conditions shall not violate or conflict with any provisions of this Agreement. + +4. 
Additional Commercial Terms + 4.1 If you wish to engage in any of the following activities using Kanana Materials or any Derivative Works, you must obtain a separate commercial license expressly granted by KAKAO: + (i) Offering or (re)selling to third parties access to Kanana Materials or any Derivative Works through API, cloud platforms, or other remote access services; + (ii) Offering or (re)selling to third parties Kanana Materials or any Derivative Works in whole or in part, as part of a system integration (SI) or on-premise deployment solution; or + (iii) Offering or (re)selling to third parties Kanana Materials or any Derivative Works embedded in an on-device domains. + 4.2 If, as of Kanana Release Date, the number of monthly active users of the products or services provided by you and/or your affiliates, is greater than 10 million in the preceding calendar month, you must obtain a separate commercial license expressly granted by KAKAO. + 4.3 For clarity, unless your activities or conditions fall within those specified in Sections 4.1 and 4.2 above, you may use Kanana Materials or any Derivative Works for the development and operation of your own services without obtaining a commercial license from KAKAO. + 4.4 The grant of any commercial license under Sections 4.1 and 4.2 shall be at KAKAO’s sole discretion + +5. Outputs +KAKAO will not claim any rights to Outputs you generate using Kanana Materials. You shall be solely responsible for Outputs and the use thereof. + +6. Disclaimer of Warranty +Unless required by law, Kanana Materials are provided on an “AS IS” basis, and KAKAO disclaims all warranties of any kind, both express and implied, including, without limitation, any warranties of title, non-infringement, merchantability, or fitness for a particular purpose. + +7. 
Limitation on Liability +Unless required by law, in no event shall KAKAO be liable to you for damages, including any direct, indirect, special, consequential, incidental, and punitive damages of any character arising out of the use or inability to use Kanana Materials, Derivative Works, or Outputs, even if KAKAO has been advised of the possibility of such damages. + +8. Indemnification +You shall indemnify and hold KAKAO harmless from and against any and all claims that may be filed by a third party as a result of your infringement of any third party’s rights or violation of any applicable law, to the extent caused by your use or distribution of Kanana Materials, Derivative Works, or Outputs; provided, however, that the foregoing shall not apply to claims resulting from KAKAO’s willful or gross negligence. + +9. Intellectual Property + 9.1 This Agreement does not grant you any rights to use KAKAO’s trademarks, service marks, or product names. However, on a limited basis and solely for the purpose of complying with Section 3.1(v), KAKAO authorizes you to use the Kanana trademark, provided that KAKAO may require you to discontinue such use at any time if you impair the value of the Kanana trademark. + 9.2 KAKAO retains ownership of Kanana Materials and Derivative Works created by KAKAO, but you will retain ownership of any Derivative Works and modifications made by you. + 9.3 If you bring any legal action or proceeding against KAKAO or a third party alleging that the Kanana Materials, Derivative Works, or Outputs infringe your intellectual property rights, your rights under this Agreement shall automatically terminate as of the date such action is filed. + 9.4 You acknowledge that Model Weights are a valuable asset of KAKAO. You shall not extract, copy, distribute, modify Model Weights or use them to train new models, except as expressly permitted under this Agreement. 
+ 9.5 The protections under this Agreement apply to all components of Kanana Materials (irrespective of whether it is recognized as a work of authorship), including, but not limited to, Model Weights, parameters, algorithms, or structures. You may exercise your rights in these components only to the extent expressly permitted under this Agreement. + +10. Term and Termination +The term of this Agreement will commence upon your acceptance of this Agreement or access to Kanana Materials and will continue in full force and effect until terminated in accordance with the terms and conditions herein. KAKAO may terminate this Agreement if you are in breach of any term or condition of this Agreement. Upon termination of this Agreement, you shall delete and cease use of Kanana Materials and Derivative Works. Sections 5, 6, 7, 8, 10 and 11 shall survive the termination of this Agreement. + +11. Governing Law and Arbitration + 11.1 This Agreement will be governed and construed under the laws of the Republic of Korea, without regard to its conflicts of laws principles. + 11.2 Any disputes arising out of or in connection with this Agreement shall be finally settled by arbitration in accordance with the International Arbitration Rules of the Korean Commercial Arbitration Board. The number of arbitrators shall be one. The seat, or legal place, of arbitral proceedings shall be Seoul, Republic of Korea. The language to be used in the arbitral proceedings shall be English. Either party may seek interim or provisional relief from a court of competent jurisdiction, which shall not be considered a waiver of any provision in this Section. The arbitral tribunal also has the authority to issue orders for interim or provisional relief. + +12. No Waiver +KAKAO’s failure or delay in exercising any of its rights under this Agreement shall not constitute a waiver of such rights. 
\ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..f4255be --- /dev/null +++ b/README.md @@ -0,0 +1,238 @@ +--- +language: +- en +- ko +library_name: transformers +license: other +license_name: "kanana" +license_link: LICENSE +pipeline_tag: text-generation +model_id: kakaocorp/kanana-1.5-15.7b-a3b-instruct +repo: kakaocorp/kanana-1.5-15.7b-a3b-instruct +developers: Kanana LLM +training_regime: bf16 mixed precision +--- + +

+
+ + + +
+ +

+🤗 1.5 HF Models   | +  📕 Kanana-1.5-15.7B-A3B Blog   + +
+ +## News 🔥 + +- ✨`2025/07/24`: Published a [blog post](https://tech.kakao.com/posts/716) about `Kanana-1.5-15.7B-A3B` models and released 🤗[HF model weights](https://kko.kakao.com/kananallm). +- 📕`2025/05/23`: Published a [blog post](https://tech.kakao.com/posts/707) about `Kanana 1.5` models and released 🤗[HF model weights](https://kko.kakao.com/kananallm). +- 📜`2025/02/27`: Released [Technical Report](https://arxiv.org/abs/2502.18934) and 🤗[HF model weights](https://huggingface.co/collections/kakaocorp/kanana-nano-21b-67a326cda1c449c8d4172259). +- 📕`2025/01/10`: Published a [blog post](https://tech.kakao.com/posts/682) about the development of the `Kanana Nano` model. +- 📕`2024/11/14`: Published blog posts ([pre-training](https://tech.kakao.com/posts/661), [post-training](https://tech.kakao.com/posts/662)) about the development of `Kanana` models. +- ▶️`2024/11/06`: Published a [presentation video](https://youtu.be/HTBl142x9GI?si=o_we6t9suYK8DfX3) about the development of the `Kanana` models. + +
+ +## Table of Contents + +- [Kanana-1.5-15.7B-A3B](#kanana-15-157b-a3b) + - [Performance](#performance) + - [Base Model Evaluation](#base-model-evaluation) + - [Instruct Model Evaluation](#instruct-model-evaluation) +- [Contributors](#contributors) +- [Citation](#citation) +- [Contact](#contact) + +
+ +# Kanana-1.5-15.7B-A3B + +Introducing `Kanana-1.5-15.7B-A3B`, the first Mixture-of-Experts (MoE) model in our Kanana family, engineered for exceptional efficiency and powerful performance. `Kanana-1.5-15.7B-A3B`, which has sparse architecture, delivers capabilities comparable to the `Kanana-1.5-8B` dense model while utilizing only 37% of the FLOPS per token, making it a highly inference-efficient and cost-effective solution for real-world applications. Furthermore, `Kanana-1.5-15.7B-A3B` is powered by our newly enhanced post-training strategy, which includes on-policy distillation followed by reinforcement learning. + +> [!Note] +> Neither the pre-training nor the post-training data includes Kakao user data. + +## Performance + +### Base Model Evaluation + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelsMMLUKMMLUHAERAEHumanEvalMBPPGSM8K
Kanana-1.5-15.7B-A3B64.7951.7783.2359.7660.1061.18
Kanana-1.5-8B64.2448.9482.7761.5957.8063.53
Kanana-1.5-3B*59.2347.3078.0046.3446.8061.79
+ +
+ +### Instruct Model Evaluation + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelsMT-BenchKoMT-BenchIFEvalHumanEval+MBPP+GSM8K (0-shot)MATHMMLU (0-shot, CoT)KMMLU (0-shot, CoT)
Kanana-1.5-15.7B-A3B7.677.2473.3579.2770.3783.0266.4268.5548.92
Kanana-1.5-8B7.767.6380.1176.8367.9987.6467.5468.8248.28
Kanana-1.5-3B*7.016.5270.0870.7364.2980.3656.7059.6937.60
+ +> [!Note] +> \* This model is not open-sourced; it is listed only for comparison with Kanana-1.5-15.7B-A3B. + +
+ +### Evaluation Protocol +- Base Model Benchmarks + - MMLU, KMMLU, HAE-RAE: 5-shot, log-likelihood + - HumanEval: 0-shot, pass@1 + - MBPP: 3-shot, pass@1 + - GSM8K: 5-shot, exact-match (strict-match) + +- Instruct Model Benchmarks + - MT-Bench, KoMT-Bench: 0-shot, gpt-4o-2024-08-06 as judge model + - IFEval: 0-shot, mean of strict-prompt-level and strict-instruction-level + - HumanEval+, MBPP+: 0-shot, pass@1 + - GSM8K, MATH: 0-shot, rule-based verification + +
+ +## Quickstart + +### vLLM +- `vllm>=0.8.5` or the latest version is required to run `Kanana` models. + +#### Example Usage for `Kanana-1.5-15.7B-A3B-Instruct` +```bash +vllm serve $path_to_model \ + --served_model_name kanana-1.5-15.7b-a3b-instruct \ + --max-model-len 32768 \ + --gpu-memory-utilization 0.9 \ + --port 8000 \ + --dtype auto \ + --disable_cascade_attn \ + --tool-parser-plugin kanana_tool_calls/functionary_kanana_tool_parser.py \ + --tool-call-parser functionary_v3_llama_31 \ + --enable-auto-tool-choice \ + --chat-template kanana_tool_calls/lmalign_v1.jinja + +curl http://localhost:8000/v1/chat/completions -H "Content-Type: application/json" -d '{ + "model": "kanana-1.5-15.7b-a3b-instruct", + "messages": [ + {"role": "system", "content": "You are a helpful AI assistant developed by Kakao."}, + {"role": "user", "content": "Explain LLM to a 5-year-old child in two simple sentences."} + ], + "top_k": 1, + "max_tokens": 72 +}' + +# Output: +''' +... +"choices":[{"index":0,"message":{"role":"assistant","content":"Sure! Imagine you have a super smart friend who can read and understand lots of books, talk to you in many different languages, and even help you with your homework. That is kind of like a Large Language Model (LLM) - it is a special computer friend that can do many cool things with words!" ... +... +''' +``` + +
+ +## Contributors +- Language Model Training + - Yunju Bak, Doohae Jung, Boseop Kim, Nayeon Kim, Hojin Lee, Jaesun Park, Minho Ryu, Jiyeon Ham, Seungjae Jung, Hyunho Kim, Hyunwoong Ko, Changmin Lee, Taegyeong Eo + +
+ +## Citation + +``` +@misc{kananallmteam2025kananacomputeefficientbilinguallanguage, + title={Kanana: Compute-efficient Bilingual Language Models}, + author={Kanana LLM Team and Yunju Bak and Hojin Lee and Minho Ryu and Jiyeon Ham and Seungjae Jung and Daniel Wontae Nam and Taegyeong Eo and Donghun Lee and Doohae Jung and Boseop Kim and Nayeon Kim and Jaesun Park and Hyunho Kim and Hyunwoong Ko and Changmin Lee and Kyoung-Woon On and Seulye Baeg and Junrae Cho and Sunghee Jung and Jieun Kang and EungGyun Kim and Eunhwa Kim and Byeongil Ko and Daniel Lee and Minchul Lee and Miok Lee and Shinbok Lee and Gaeun Seo}, + year={2025}, + eprint={2502.18934}, + archivePrefix={arXiv}, + primaryClass={cs.CL}, + url={https://arxiv.org/abs/2502.18934}, +} +``` + +
+ +## Contact +- Kanana LLM Team Technical Support: kanana-llm@kakaocorp.com +- Business & Partnership Contact: alpha.k@kakaocorp.com \ No newline at end of file diff --git a/assets/logo/kanana-logo.png b/assets/logo/kanana-logo.png new file mode 100644 index 0000000000000000000000000000000000000000..e446d47b26e8088a789f6697b4d549d043db941b GIT binary patch literal 59023 zcmY(rbyO36_%=KcM7l##Kn0{xKu|y$N$D6NAl;p#WAqoL+acXCkimvZDcvJS*XV{( zkH7Q2zek=w7H4PY+8f2L4MrYL6pOd(6s{R+;>*wkUW-}K3!&nc5ewrQ9kT4w2)h5yA*^WLWd zvSD#Jv%VMWq@QY|LsVyDpIDa`un}R!+i9{1%&G*J_LqO*82VEVb7?(?-|@S;ZLhl@ zebSrAp1pf}t^*bfi$B&6dXNst!3$}#xaq|$Bzi}rkU3IP|2W5e9#y+PQ`=2QdDV+4 zkW3nr|gDXY7BLq_SuQfv}+>Kq7?(Eoq5c4^x;gr<|Eb!GMWGXi5MH# zYjNRP*f{nFZUNa;pHsw5iBr&IZX+s7jLTBP0iWbi11{MBlS!#Ev(6pWrM)zQVlB#9d>`kru z2UI`dOUM-eX6NO==M9R|^V@lY$cjz5Ga$fQG8q3&Lm>MOU5)Z=lmr~*mxs4ua_bT%?NO+LD6YWOdk=Tul7G2aIq>j$#Hk0e$dQ^fu?xL<5r*ju zDtk|Zbh!l;N8QT>j`#%H@jLiX7x#Om;K}&qhtI#Mm&u=&g<%ZfRvz}{8EJQU5_T$A zI+rke<;OkNd@pZwKs8hSYDsLMj3JWDU%`ZB)myl6K*Nd2?|;9Nk7y!@#B zFB9B%rVXTT7VeDOXhNTTQul1^LR-I4(Q!G+&QgJ+x4|ctXGWydxjLvRM%#p~VjFT$ z$;sAiyj)7NR)cE7=kx9?E&a=)?&H903#lKbt?wC=OC|s4AUAOVeeJ>IHI=W$@0sK< zq=1jU`?;~~2SBp9GAS#i_h_^Kh=ys2I2O5NQbq2KC!OVz741zw=5@h8tB6HYMqHII zL@4e5DKpfg<37*!pV;vJI$_h*$p0nqbw-!-CZ6-<7zaTM6i70%y zBbB19DFL5&yaOubXTgf7Y&vYwU-U3(X><~zyDDqI!ofI&{F!#UR`a3VH)-i}D)?i{ z?Lw>?Fpgi%Yy%u-mzG2s${~Z?ydFo;H5txndCbBFEeU0s`wh@nUz4S*JTf`=7vwN>T@o(mRg!wg6@m z`*e-W%RXS4Vb1x;IM08}o~7G8Y;%fQ-&GH7sHNxWE&HQrr}>?r-CSsn;_O3=>f;it zv4P~h_#!8xm4MwBvk90wnBM9QW;Q`y|FW|FYh`M|ZT{`i z-o&H1cm9i|bIyHnkJEveGba)y% zkJAKD2bPUB_A4V4r;3rgf_KF;nod^7WoI7w1~eMX9@hD^0OPyUIA13;*?l`7IIx!9 zO_-r1@*_@cLcNW?NdL~w#1uWVsHlV07j!$!Hh~<$2b6`sc^BH;fL>o9uU_9KNdEAU(_yLb0NFJjqn|6*B%S7tE;xwDh74`E@@HD;?F2Jm=?CA)#_MtX zlbhYKT*`Fez`tvX?aKXBkZH5Cg=aYOb;=)~_pXV+-EMS)@&0tvb+Q!j+9L$(?B1Id*e|@mO*v%YuPl44BVxx~v+s{V#ya4$RcZ?Us#RD`n(N(s43fXL0AQ_#@ z@9_G;?U!YNJZJ=Y(cb0SjFTK>C|1TrE*`kj*b7`Sw9IOREC4MNrw4Y=zIRZT5WgJS zoAWkBwk*S?&iVk=w=>ZPy=Z3ge<5~1V2t@2Vt8W!^A9z^P&`3@If|xQ)?~6)u*9^x 
ztQFf&_WPt&#kT-Ef{iLMXoQE#BU&$5{%nx?Y#PW)>a*5gQ{0Upy3>)C^b`6avN7@y4}jzqdwY11 zD9=4OR2=xKP^K8mUzHNp5>TbH9H??8>6^$=3yH?ur z=PutG{Fd~kA{+u9$NodB|H2oCaZc~9i{>2wdHJ8ykq|Fd0;jzs=L@Lo}Kjr`)}wV$dEOTd&Z zcPu>B0W|KsP`zZSg$EUo=o^ap^?kaSoH##eHz5R;543rN<_+d;4QUV?j+JTd7IE~u zDX%L&6OGt6ekERQ&n_CyGg}-S{TL+4+G~tyj-@jd&L1%o20i|fI;5#{FXbJ6g%YBN z;3sFoPX$3bO6mDkN(XZvp9;s(GVM<1zU=-O?4=1ZMbisMXRg9zNgsA^&T`8CoACcZ zm)_x?uElW)!Jqx6@44AXyV#Y3B*lz=kw1-colk{&G$s)ovqLZ$@1%qYKsq|jTD6(X8t-9O7ursBT)`{v`DRyiVXBt&#@DrzaZ|+Z^Oe%6Idp1u9 zrsl1h=6z=3#d}_Q*B@u{36t@|c)V;#5C^D}mOyL{<61vEO?c!x&Q@vjrubpSHy=Cs zrshsteF2uoLpyKeKe4>AVYf4?RB}5nKX#14(C{9@xN?%@KPQ1t%|EH@<#V0cKr>5? zw*xoxq^_Ps?Arv#qVE;jZ!t3In|9aElMyA`@qA0I2_q3B%^eTCu>f_{QO`RxPV>D1W8B>E5q}|c4wc7uJp9$o3 zo`Ve}i63vVmtXsSP!&57glI$6p?pPLhaU-xxoqXFVqL_u-cPT*Wd@gG9L6o>E@?uwb~jZF#S5LL6PG;rn%HNdy{^WB7tb9suyxe_}9}2bi39} zx~w|>n4`5$Vpi_thSi7vSE_|n!c96q0>lLvQX%IlJrCsRlcinXrTDyQcCxkYn0?b) z>wxTON*dYJPf1PG59*9^Nes@imsmMznhd+2De60j|1 zm0L_^A(rOF3j^6S+BKQ5x(7;OfXBI(_KhI>0_2Y^5Aq*zFYn{{r-dm|>6@D1vnmzV zZl+EH@OTJsxdYEnA64)e1ZF7u)ie%$EWfaMHU8>8-Z~g^7Vu$wX^U>P>C~^$&9+pqS9=0=l*y5;8Kxg7y6oh}&fZiw)Idsoz zC4B+K*s+wnU47L!)~@;oS>4y>=IJ+vXGzr1e^~P5V%s^vX2$(GU&ke0s$`#TV4Oc8 zH{`ufrkkm3VbIZqHl})J5a2=LrY~v4HUjk_7!CQ2Hdx!ce zYE4t9o8zXEizwT4*?y0{odgdHPb&b%c`o6s9xor%=cgW{e$EyT)a>!+-I(&}fSmTk z^sVMbPr6QuF*fWnWWQdg<2I$aBL9Oh>raR}$0S0tr#CKb5D_Zu*7xvjTJ((Z>up0m z$l-D5#;0$upELHAoJK< z;u?@;;LBKlbzlz%ot0?{%&Ny}3_NPqb(SIsY*M_c*zR?lsn11c^Cg~;qTk}^l1?~V zbzkSqI@^*IoQMLNv5b9_Nx7c=3rO^jJht)Rvj!IvX^OGXEzPlau||r#rG}bQUN`}1 zm3UjQ=9jGXMro;*oy%BdmgFdF5aYGS#(K)c?W62O-XWGDAJE*%5IBNmeX40TmXjsU zIgbL%X~4yqs!<;in>TkNHtwVkg%e;EDWQy7;kH|TIb|a2jSe~69*eTd|NQcswXVM4 zR#ftM@^ZMyKa+Rv%&RVmu=z@?Os(-Z;|GE%UO_}nl0wVN=n$iKgOa|-M0VKH1N?Lr zH#+1~Iniqk$A#fsZ1yUTkdaly*kVyu8YL;2tq)PfJ*DudMF%IPc>G)5Gudw_ob|!F ziJ)HV*q>_}LHK=-`TkKKSv^HS%!hXT#Xn`qy-rwSde}2lb-e4bpSXzy5zpw8VkY!} zHI4;3-+^qqI#=40zU3cDrWhXjj}??Ud?G0CJ_!;oaHNtHg&dW{ZfeUNE_+zAv%PkD zj^F;G=Bl?wVk)ykdMeMIuXsvm2-B7(iGiy)dx)@%V;RIqJ<5w_qHvxUl9g7Se4yf3qzP;p 
z7Er&Gl{p;T?%H+nq3LmhVAm}p3&8lAQ1#}Y3Nj@BO^5jdoN*R&IKs}YE|>BQ+g^2c zn?8D3*b?28=Q=}?%8?F@*v0poypl9+Y>h?L9Kk!fsYW=~6<8$l4i@!zje)nmEhn=W?b}{w3^xhW&9LlD?bc zJ3(tD)n1)POnlAf9o`;78C2E5SIP(fXi5TgMEeRe)4I)os);l%GsB34#%9RHGt`Xj zEH7)T)q;O%iH&SNgFd4OTT>5??d5c5=DBS<`3Yu#Jl*Q<=A#DWin+U?SE3zYd^^Iw zgvM%-`*$p*F2LGt_qE|}fFJHh{NtFsbiC4*QE{S_?%8kea<$stFV~E{O=-k^-U}iT z<;F?8H+$O*x81`n#tCKXBRr%(n`+i)PrB^i{8Zo@@&He^csVv-*A1>1wD>$TLK>U@ zWqeKFhJhzi3_*Hc#I2JVsW*aae*C8an-v@1W8X<;aRi0&2V~|g>jKh)w(QzOY8dVX zO7aWa_}#3T|MA-ph7fSd04WRgehc%Xfzl0Y|3@#0m6bVOes-CS^Cq!_=t;yk%^-rv z?A&(bz6GFNcVz{(Pu-Hz@7j`S;Yaf-aLSntxtUtWEsx4s;F|XD6N z_C|yfX1z^cvu7x=VXKwEa%J%JePgf?0IBa8_b*&zU&^@5s__n=XsMj+;wmd% zr1ThNRCX%rGbZXXpYf#NjUXwf$St2OCd9z2{7xiejtnM{pl5#bj=>Isb5v1dp@w_J z8j>?gv;vX`#D@@ESfU6J}fWzLeg$kE7T z$QUo{civxJx43j+(*)#8fPT)UGVD5CNf8#RG(l_1w2scSN<9s%)je407p3ZSCa8rZ>uXu;; z*z_*jqHKH@&R>8Q)Z~lXzz9nsH{;Ng-=hlVcPxt{>>lkF_EbH(jglB@7nDX)WS?%N z2}sQJxPFXPdxeGvZt{lu#D15AqTqTAEthalMGWGod(5d)Y~U~$O}7{Ld_3Dh&-*Rj zy4JnPt*Xt0UwvXMQ1+OQoIT+OlW-m^LG)#6+tp>k4)k=}*<;%C)(yA{u}66M!`zS~w49kv^%r|VOnSr|$UE&1q(VNhUWvRUiNnUbIn^cdfL2q6 zn_6X+)ilk0U9-a$GE`UKi*~jb$)=Oi6I)(&r87MrXEN9f0z?La_8ypS5cX@!dDWaAH*&eElt4tk}=rdtNec;EAdC z7Y{(Sx@Ype!b*3lS$4TwWy^dd6Ktmqxy(y_1-V2eW3}7EISvHmr}23P%$Y1n{}5^+a6S?*uVL z@ONYSye(B}R>xkG=3yZ=fFV+sfP>EYv2NSL9v7_k0EVf{7YEtFuT#z?OZ`?aap5G1 zH)#MA1r8~ym`R~t7aIX>g!*49fR>p z|0?zo*CWA6t?}UVI2U8U0kvTv&`xlYqS0L|)tDm^1vcX3Lj_>Hrt+E&LE2nYVj|7^ zjhSPEtgdGAkTp3KIW~f(0yAoPeIdp^POY5!*~~`Ygl9{SCZ}K|fW5hg)wlSIcr0C^ zhfri_`&ClN-F6eF&h0}@N%=)5CmtOSXZh%wj~eI5?R}Eb<&asOu8P=;mm;41N7kOO zKZNZEKV6;F@$NMfPrXS_r{qhvl}sKB!@;FT9(aWsiPWU;u0r#x6Tmz^HgCu*`y{QZ zPo0hVX)!V>tZ6InrpF|kP*s=lsnQdEmOxOOP@KJEU6ee-MjIbwM1)DoP4qyYpQ$o~ z1VEbiFbEU=BT0faQ1e!~(m~lWm!T%uwyii`Y%(~u9mR+}+{-SR{n2*f%8KEg7pi*_ zdSD63sCJaNqBKhke9iTbxeOowEw3L?9-}1u=s4SS2N_DrOk{#&TGdo=Ci5%YCcLl!8qWo94na!$ zLa8hu#tTu@JdFi#+4nH3Rt#sQ!Fi!Po9%OR=c(9n&MXr8SkHKfdfno3KQYz0lo}aH z%5iU2;MV@z_-q7&Rwzb0l(4A6gciYdQMK_3`DA@ct~aJlRiNQUN3X^n?%DN~P0V;R 
zexljerg_5Vav}vkUH-mGH4^A;My+4Lt~4^B9s7gG-ps?>({n7FdBuE)p zCGXJ#&UJyP^nf|oBpmwNV!xct(_xO8!#*%JqmA~=V!??4orKA%ntTm#?{G*YEhELf ze>yCbN<>dqgR3;pM@0(l*CDmlA#G{I;h*N{2LBiT(4-{sSem9TE{m=lFThCSP5isN z5G~3Po8MpZwEHT-F=)RAwoAQ)GZag4~FH-dmeQfAjSA|#c{z3S+sG3 z8^ze=I2tVv^-M(Zw#*o3`ul13Cz>(ok~7;n2`e{Q1&7=Z_+MOo9s7~*N2J)B3(PI8 z2JN}=5gcQLMiKFujwTh62_I)0CtGzT?U*UA5~ov!SX_H@Gi@Zkvk=X~>|nL}xn}Ac zIC2VQU&7Yh{g{7{OvjL?4uxF2lm8uvmENbAHYo+RYFY(trxzp2Zu zu=4!RpStQgN1FY#?@sbChM=k}zHSPEXz^qhiS{H%>qd0jnJJuc>_szVu_%eOIyr;H z^KuUBJ91Tr^>0_6P>;`V(DWbfTFmk>RRD2o>TYdTZq(!ET$|Zgwqi5d|J?<6%3|`M z!)3q0p)kB}1i4cZ8xqn?NRI!vWFom>q+ zsmS`erxS19NcmjmKs*gckbnB=y0`-(idQTjH|i6OlE}w?h7T)Z>s7*I;dm(s>|IMc z1~&tRdFy$cQ;t1naJhXIaPxGKXME#HwbhUkjSFzYs$4^R#xDZ>QF-OiVuhw+hSp&n zyw&2Vs&n3lKKVfTT?l>;_*t3Y1Rfa>1;MDC1%LHo^v5Xr!J4O zRqYhcRSaY>?Jb;aaqZ>TaF4&&xrFvxyK@mvKC4rn{ygGj1t`y!dOI6& znH>Et^9;8X`BT~I(~?Q^B+O_HWKt-3^-?%jb-`A?d)@dIW1XPl>wV-4y7L@!4@agW zct!J*%BzkOXnQSt&=Cs)^e3P9AB(aI|8=Gu0gl6xWBY6oMLA4KA-|G$_YZ7hRk^;7brO& zOm2sM%ZwgWC9|v=pj}BdEFH>Bt2G`M+uln+zN}kV)t_oj_>~`X=0599bSt1}@x6>YA|zGAw)DK8>_Z z;LhqY03+ca(D=(~zI=f^GYk-)1ypAAG-5&E0|OvxGhsE(s!yEsCO`n4OB~-M!6h`Q zc{9O{owSeuU5RP!J?5;FbI=zMVLO)i>AUpk1V;KXo}IDbx*{vlVKl(9GbTtG}U+;$P_TbbRm*z=yR$TAt!WqiLI_{FCuWrsruU z(yzBQXTi<3<|vW2nAjrTAcFN$)_H@O!Ef|9`h_U$x1sa;3nZb%)PH^(vh#fdmz7A9 z<_7m-+G8TGg~>L5mco;kH!el}d>apP=DTOyHkv@rFFIlGS7j{+wgAShl*sU8DjW-C{d|&J9_TWd=$b*eyg(u1p7CoL$Dq-YfCX?Bi~BIw20=?P5+KIKD+= z2hyNR)v^bi^6ajNG`m_VoWU!g(UOgabGi(ah$p(MHw_?6lBYnRFUkrYGZJ zEWiqXlfb2>AlDu7bq&0bp8fj1HG0F5%@6rKopv7Z=Z!Vj^v6G6xX29#P*;Fw0)DnS zTUTv-6FhpomcSNy2Lqj2%+UTT8llV_S$NWDqkDtA=~6XR zX*y1dV_w3*#}*+(>BoK7n0{`I0IsZR=pj7c_+Xy=r)ZEl3JMN!2UVWZ3k}ao1{@D> z^a1fa#Mg1^V`p_Gy^}_))qI!v7Fq5H3uXETfE*K*7)Pu1rfQREq!Yt6%r>PtkWXCw zL(#zVtJ218hqqF#A9JSSmIk1dyR)Y-K7!2l{h>$qI#QubJ{gJbxRxKWR9@`X+9V!w zZ;*l^tZYnLjEoTFlK2vKlh7GjlgZ%3)9+%V&GnDBPXx8ulCG4d6+V4W@0&el3b}lu z@-hiVxobB4<#f3%3sG zWIqj_7q!fLrSZ52Gtu$ws$|6U4MV(Oo7?Io%k9IHo5x@89lkstv*{oaWFx>8EnrFp 
z%8yuUN)X}G(U3_uSikaDjgq;|X9>;T>7k-_k+)MZmx=|Sl|nv+gKwMIKGTAyaEE)M zlOpp}TFE0ROckSj*puWFHZFIfK1>}Z_CQ8~Hz(JGEafn;;(i|c1~VUN-k*w!b&Kyg z{1S&E_~!_vxW~GNL|(vc$zHF*xL#I4(Thr+j+ z?;gZ^Oy6GKttIiFglYGi&w67%3no`m)@W-*esiU^s9}9=eaXuSou{PdC7)7&Qn0jk zfazop4`imj$;A&_YpO6vJEPV0P_&l%3-BjCSUbJ@R}t}V467=<_OG(s9G2AC(lPav5~Dii#_^mx?2cRVM=%)tiUX2{+<7*n+d5=Mov zk|~GID@kkN_x?it7gR{qWc3clj69Z298=7s-POsl=Qk#-Ya8!KZSdB)`apl>BauHx z@-AIp632&mo$-sAQNekq>z1<{UnSVb<3Wdl^5;qD;S_yI09Hr?@JDz_Xbl_%I;;8f zVE~G13vKZ>ZJ+yXBsz_WDBeU2?imOJxl2^d4fYR5BE28fLbRmDWFQ$1&X-?w?i z{hu?(7xO=mX3g?jT8mX{`YIvFHK*3{d=A$NHM+Q#<%0|jQz}?W~xLf1~F+2}{mw|9JKj{VeNbm=+*5+Fw~2>vef-=?so+vMR1ZUb2yKQ;{T7GH+k+ z@6+LIe5@_$LW@9l3m-D^u?|_wbPW*FmR6VVqyT61BY077wZ(v1-*@N?qAt1u{)SSQ za|l%VmhLo|V|16o4>&*tJTSfWpV_o)V$^Zkrlo`hyOsPthHTTXpl8i_DCUV@>u)p) zuhV&8wwjDm_|_>DMxm9zjkDFh=CSVHQ}>~DFKq!;xD`kxm}2Nv)s+s!iV^bFi(^EL zFj36?E#X@D?o&|qU<~I`26N|Qx%O_^_i?3XbfdD$+g@}+U-4e%syYl<#OrPLJH^?r zCsQ`P_|tk7<2WMzP!BPizz)^ntf?w5-4Y z5;#C#-i{rr0f947ql)~?w7#F*MSqPZOKn9<$4`zdO~|V2Hnu$rBW0igv9C_NVljGg zMb8EoSdyEzVXvd{V}Q7~OZ7L{fI`CEzq8aKZ@XzLq)m9{JC74NQD z9Gra9+d@KUr1*z4?kR2%QCBxiUSCOsW2yGNg*c#X0~KPn-NgNYYc20P@jjB&(!>&T zhY@G74*FIkLvvYXyRE{jPQgH+L+c`@m?dWd+{eA*wVJjrTf0{-Vhb*IxifAggY?O>z8z ze^IXR;-k|e$4Onaf8B3lmea?#@Ce#1`_w+L7q6wa=4|5cd2Xa2{*=s94T!(Gls0~N zuQjz{9;DYK)Ueo{92*8z`Hy`l0N3PwV3#qIG-Bu34P%+h5H#b^)Sn58?6GVymt#9iOn*Hw84tE*CKXnwf>CZh|9YxVtt)(Z6#s6(y1#B6}mD6y&P$oAntu%6@wK8hd-!dnl zl}mXOwRtKas4TG&K9o)AA1>`evMJK_JY=MrppMqcJz?;#v;CWwHnThqgBE=dl7S>g zaD#|?wMG#kxsxCl4jGABPl088B<8JByQ;NZX~4jal2f}I2oKs_H(9eb^u0EBzt+B? zdU}D2<b8JAo7hT1KM*E^b&Y5W5*cf{%h*&JYE2X)14cHx zj6eA^XlJr4H$ZLSo1k)!Z@`h&yhTZ(XOLyWJE()jTL<+Phg7Hzggl{;W542o!wtv36Z*>o!`(q@q7$r8Gse|_a56#M{p)}J$WhTMULB!bRyOe zZ;IH~?K%;23VZx#fox079CgX`?%6siyVLp^**|tM#A_mSGh!>u(2R>|k-?3p-Sv_? z8`ksrO}-QUp{o2whrg;f!#%S^5U5!$7=!lmbaw4NVC&INX?<4SGcJxp#pX!S{~*K! 
zXN9#?$Q!YpI@S$XyO37XQph=Xs$wEhY?Npv4*V#~K903$Ns1S^&fOtwYWk%Vg2A$c z$0F)J+x9@(z2g13XW%dfSx`Aoan9GJX+V`im1gmh{AZx%rdNynEA^Z)601)bfrsoP z_u3=W^x!X_XQG*x{5)F*jnvDZ1Of_@vJ@Uo@v3r+)KPR0S!uV<5N<%}q)vpF!Sb3) zg6o>m9_I`s-A^OQ%+_D==MJoS>1}4o6TC;Au4m1hBxAZfW!${yJU*tzNj&f~ZQorQ zp#DqbTX@)#SJVOX^R`}4*5rjQ7qWQMBDMMUE3(nchFK$oD!yet+xP7z?TE{?s=A6_ z6wn4;2aN%H4!piF-z!yr1o14rbn3s;a5AB2CoVdBe=I=~CkS^6G3f#k7i2tEWPi6C zEMNNN^*HQYz%+hM_Ps-$Bnia(gJ7Azkg@@b=gG3HupUc#9zi`Bi^T^SM=DbG3BR=l zGUk+B^LQTE9{M!&S8RE6vA~P|nWLjC(O2^->xi)*mOj|Q2R%-8vvX1u`P;v5{XPDm zfu`Yg--C9?1dSP6ZemSLa}0LG&cQ~CZv{1*-g!EP&WG4Pa{X>odAjrGI06?MP_S%Cv4?g|Fg5$S4D11T?EHn=&=4V-L@G&kFsdIlawBesDwK%-gKQ#Bo#Jm*1%~ z_hUvp)@*h)KS=g?ew?dgKa1_Tg|s~Y;B1E$rR`3zAN))4N7E!S+R)LKP4FqBnh8~T zhq%89`cKr+Ea8e3QQ6LD{MoLy-MEZ*a<4r8O3}OdSlj)!a-7{;bBL_u1y6U6j;VS8 zT_MGC*KqOFiwJ+inxup-K_983sUxf$`&8F0^1j7&w*|Y!@N>MtEmGYR9|+A9Rz~|P zvWWz7kmSy9$3pGe!GL+cwE06;!fewwq)Za1yY>e1NhhMM1gsk$1=9wY6SFMgc@uIl z3GW|IJ~E7Px|DvH+^nq(HWJj=k~s$Z{2&YLzT~U{&V+Y4qkl z`C~@?yi+?~dwp!P1-_Y^(eH#Wji$c5#jE3&!kNel51ir}c48zVN93kjz^~52YsH>_ z&kA59e;v%>x`crLhHiJ^u{^psVo9?peRfU4*2*zKvZ{3F-YN$bbTnY#@X(v97i-qw zGv=L~kMVX%uyQhe_gqdU7=(QJIhf(-aV+}U@7Pwp_TQQ%nNY%uXmP+QV1x%{|8T1! z9(&hQo|@cAF2ROcKlZ1rr)bLSG8Wg@zc*WdeG7E?%H9zNJ~pR-E_6K#pKDga6T}Y? 
zRIC7!Ul#w`joSpWCC|9qJk{UGR)`-dnBEvb>T zm!@wasfFXDfnxe0Bb;U!+Hc0LDm^DFKVnQ7U|RyJaS7nH0KOF7LxFEE2{n;1LmdnB zQuOomFR6Os_3u&r*!16F?Ab6Eoa+Uv>&STn+lb1~a@t{SP-eSCN%$kS7j2A$n~=~q zU!{uc@XSpHW%>)s55J9QJ<(ah$aC&JfgwjO>M|5tz&`~U5};*7qVmT(?Nm!^&*fju zFvvc^e%(N9?7w=^bsRLrP8fK5?$fuH{d&N<*wYJM3<=VfcQycc%Uutb@d*`fPKfOt zns^qDl_+6MpTbdc|0z!TqC|9qt6l^buNyVjb$aeMW8K4-_y&_05b;+owv)&2kHY0V z7L@n3**-q|#F5-g8|tMpA~nko>0Nn(u#)nwklX%c$jxT3>ddma{vEhOvYPj7%_x=2 z$lds+`a~?IUKU0mW<_o_OSrg}0R(rfOVf)>{pZCh$}tWjmc$Z_;FEt(bR)*Yjt)JS zV048kJ@kBg@i!upcUMBGDk>PJ;r53aC{*lil9m{sCM0lgKW4aIjnWGkPjJ-~6U6RN zncb!_o07a1cgvO{1iw4y#HnavszRmi>(w3KGfDMpx*AZrL6(7BjQ-2(?URwv>CYix z6V|~8AGieS$@s4DbduMUp}>!1vD`_Y!FI8CoX_3@48C0wcggC&gqxnB6y8@m$q;ui0>+wV7^Up2&uMSF>O&3Mmvzo<( zysx4B`2lP-AQ1E~Wh@D^jqtKEmWoznah8N>qkhdivGpUf(9yi|`qsiIeuDI;X@v@y z=GUnEyS(4C0*bBsO5MXy`+i2W>50R$H%0_ch(-ny^hm>N*W`EquDp^VWp0C2rqow- zHA@Av)`VOFw9R^69V@I-MMx#p-16MydDQp6H(L>kadYJm;Dd?3x?8 zk^hx^G1%SehuT(s+m$3}Lz{fle%voC1ngmbCdbuPcu=d+ZlNmBnW5FL(~89@*J}Ur z35}Isf8>j8$YKwB(X%*Hus)<>nxAG{m*8w!A7K8Ugw)aMVZ8d#oDaP(+W5!*JYP+~ zyZxls`fV@vq|go!TQW3TpQjW1rM_8L`4I zbi36!0Jn4Oe06tY) ze}@)hgm*3K@2HyD>)z6avv{r4fK2OKtLiw2Cad>p0@`W2KTMPH)F+OHNz+gMIw)AM z_fwU~_#oe)vh=vVWK9XmPNs7?Eby(xj-e&+w{TuW^P?R-f;Ms=ZuiD>ndcTu`buH9 z&g3&W^NfLKqQt}b8TN%TgAa;6a`yEqomQ{Tlky*2-1JC^OB`G7qkb)14>Vu@K6+@? 
z=Eujd_w@rbHQzIC#+PWUaDv0!SY^%Ea^7p)M^=^8D?4r2V=Odo=oD)_pU7= zd#IKtrW(~BxmgfIi^AWo2EiFthpJ-6;zhDcLXDlbc-rEjCE`XD~)~RGU9V5n@Vh4D; z35wO6`W(i}kyb)7^Jd(vjd4xEYe!sj0cW3L;_@#QT~?YA^n_~A_R090j8cZLZ)s6p z)xxts6XB>1VaDrQ=&14PB+Kzv<}pOaTDHDa~=WQw%ZR~$n^xL*RXvKDUU-1;D;?qDV z3aWx4C3yMbf{ds{<-KI%)0|X-!_5n6hE$|YE`^>amI$5%UJrex_)>o|}I~(N1{#aaK+vHf?b6aWowCxoWZ9lB z#`5RSf_RJ$1^gcWhy$2@dnYRrLq#1Z3?~7;V_6Xy1>q9BVo;+n|LYXoUE8jXr)HLK zHgAKD>Dd`N+*?x4$IS^hEe`@l1X-OXR~-@-;K-bV%lx|zZUEv#@BA}oPna_$&tvr@ zgUQp+`m*0}>RlzCWd(wj($|Due5bie@V4(qnNhdoMDB^t%pH5t1&eaFbCV;^{v17+ zU}V&kf--2i;>@`bTp+9GLdRxbCkHOE>@VM4+%#`Po0$K~x8QSkU{lFk<+c7zLQrn|x=5Nhg_pHa7T2;roSH))ZNpWX z@5@zsr6(ot#ABo8m<@B#+v7B!+Kq~=&~G|^ov**J%}yzll( zh)f2){(?+^;65xVmcIlFaC8b+BRJxZA z>5iqlmRfpgzU%w`-ao#3&fUXa?%6vt&-BclM_A*fn4V0oMz^|lQbLj~nyS<1WC$%9 z6^3k1zd_3kb6npWcrA-P+F_!8w6iOgvg;(X-%Y@KcSHTWZFm(Mk~sP1+QzkBcM)`0 zbXx9lIFU8-FYmuM(W&}@lg_joCjOVi^emG3n0Ky>iec1d~awat4x&Dt`3 zlAjy}v%-=4~bE+s&n>B`BxJ4%BCEz#6AM=@^TJ(IZIT~!I=&Cu`fk5 z3%4=_yNJ7RH?$!(;&l7)z$C|vM3H`nGhN58AGSO{wcCDvZO0zVX!D^HsfIy!KY}-S zl3i!dzAQ+mwS0fWWC!av*R)10g6M~<8q%anAzWKlb#iW_I zc^E5%zdQqQBC){%Vjo|4B-F}^txpHDdrRP%m1YYRUZ=}m`rGZn(YxPU4SKUt5HhCq=7x}!=7yS0#9aCM15X){(xMA$ zcTSb~H>1rc>59qc;!*j}-Jj-4a=r#zoM%_7?g)N&{RFH0z=yk3o)Yo4d^@n_>wMr| z<`X2nH7-`YO}I)(wD`1QwmW-i*EB0Jp?(nM^}DcJSFupP4HLf=9kq*yj(l;@VY!Rl zT1F+oz@X<6na+hzbF)sa_tPQu&_*MFb`_u@`8fV^caC76LJG;r8<3a88xr)m5UJ|0 zrS`jTFXYVqrsSt?ZF6&&ZsIL8J+9SwwC36H5!nw1?@lp!Xe)UFXZ@4^osVVBr#m?HC#Qke=x&DAV zWp! 
z8ypN_d|!BxovUTKKI8|5?`M>>Sqs$v5W*2D~4^G=GIrx1)tRQVBbP1=HEaeR=G`ctJ3cMYk_Kn z9N>mo++B^VmUV^E#Ymwjb$3byW|^~@xtgS!bTM3hYSqspu;~Gx9_s-K*D(Q(@{CcM z;I2wgi7M#DwH(EDS+Y;Zc^^M0bBO;V`nhV{L~h~V)c4*+dilpMe24$t6pFj~UXHO~ zo!htc5Fw3&)8c{k9%HEq9Fk5uB_+>f^P2;Kf7g1Hf?(rK%4$8uFla%# z={1!+ePmy-5i6VF9BhHf8^pBom?_EXHcL^#Fji#45Yf*96EWMdws zUPL9&ZD+Gh38ct`aAjg+iw>HC1d();0RxOuCa9leKYCl8kaPp!$k~{WGS&eZxo^eQ zR-n>f7`-@VF%FSA=ca?Mr1Rtp;0YHy+kk}iLA3GNf(Jtvb1TK->zFd)XoXRG;=ehT zmG{3N9LlqX*AUe=!)~S+-PkC_PyH(b^(AXPNyTe3%qN>8KT8|XO}c(tkgW0)E!f7* zdVcFfh3pnTy}pCFEPwYfm9{lH8h|UW=o~ycyA0AsOf*vjLgzw=<+F74m5;AbK2lta z3D4gf@9biXhC0_u?j38R=CIk!o`+6}=YDaj=)=MA0ZW)PcxPQu`%%hN<1z2fKaPr4 z8@x!R3yAJ`iKm+Stl9y(;NzH~`d}WjD~W>NXtV3IQdeAB%b7^llXgD$xGsc!_Gm{% zu%ak;(9AZV2B3vm45P6@o7qE0YKq|_!O@*utMH|!ZvHQTfH=ol(gZ$YQ)M{EbYK%v zz^G$zMfRZ9FW{wcp@Wxsd-c=_IX=Pf3J~FSxQ4v&^uj4)T z!rFGy%tRO&KfHQYCj#rKDe<=CGEGyjC3!Q#vq&GWg!C%3RtXZ!g358kbj zjYfUi>gTDQKr|X%QvPwlTEyBlJw`5{*;v${;<(XF@%tgl=)o-CR zoL&9889G}n$-4m|*6Z(h>GaJzU*e??(^b<^J!~Nx^j&Jw*woZDhrM3q_j>r_(=VqK zzMMXrBcUxux=yR3u(Ciau8a~o+EcCBKa#c#n(`P<+t0gp$6AbptELgxx{*2|X;PxN zqCbe4vwNIA*Xt{Xc%KCYkrG2oP$sA>5AelBW_D8ZBjtJcKW^yLy8nBo(il)k)m1$= zHzMu@R=2S+$tttd^WUh>mqJ>P-@OcVqJfvHE|<`;&gKOotuM3d_5F>6#TBeMq|UNf z^J4LA81xqf1EM8Njp@Ww7}KVHRH>9>Ne>?cI&C*k8wh@r>ACulu`Fgr{7o9`HQXI>gueLo; zwFUD0z7+cHV!>l+W*W5!QwpJyY-Pxkr3uxC&B>2Y^`i77l?7KX4Le8>P62MLxAEt{ zJyH1vToj`_I`N;_yG~R!ImZ7GjJD`hlpZ>%gcnK5?(4ks=I<66n|7tQ6!AV>#P+@r z9R8%Zgp=Xzitlq*q_(5|nd(z?_Bs7nf?th1+vf%2W9|5J;~4Gy8|*+@1^g><%}Dr2 zPx;1{n4*iM!x{UQdf241c0LQ^Rat`e=hAzT^*DCz-^09(-i?BQufTi5kgEa2JytUN z0oW}gbd*%r0OCZ9gZN#ix8JiH{EV)?e^5!M-#@z?kr> z2VaKo)R7la5LkmI;6D z2nb)^d%9rqcQZ9g)vT^b}2m% zVCH~OxuipRmN8yiTSKjUd2`f231gq&eIQF*kxtt66m=y$QkY?pVyeku#{i=W>B-*B zj!>{A|8|r?>{v$a9~`|X@QsP}BJi%&E#ux-DB1d=l6DFxxZs5$ar&e{d{MJ_j&E~4 zcI$J_*OFq!ThcC2k~arl%R()dmO(+(J8~zlv5gFVQ$5(z4Bf(4iL#hu+3T)AiAOLz zA6qEYfBBcgh;-yc<~-rB{9>xZDK&B$S#hqs&S^P84W9b=I=9zAP(Fjr!xy0NeRz^K<-`nusF6 zd`LJt8+esB*6>L`g4lEp`dhM&@i8o%`-!u*kq)cPDU0fB2R*zP`S4QfZ&|8wT8#PL 
zrd&QM)94&ahCWmI1d(DryDx>%nF?O|^$rE7o<3M|-iLj84R~%`0o`nSrU!y0ZN{0` z>65;KX)d%L&o5i?{ClCq{m878x&~}pfV8oW$-OF$+Dm~; z|7tEQKPo6fJA}?k=g|eAw+wMoS@KK&i|QwSoaI;JIBC>BaJxNr4c%<@?we`f0?&;% zPwd|~%W?LjCY0OuIx4(J=k(J*%%0M)1Vv=Gf&+N+r` zZNxr>N>sd*&r3~(k>){Z4OhwPx#!Mz^yl! z+s0tX_zldhoV*1-zb)U0nwv4IYs&gG^wQNkZ+PkM^r`1*hj~GUQw5O_V0A^$vUps( z_1cKNHmWNHJqbIi*>m!O=Pylt=nXvJT@rE%4qgaKI2kbIY9r9Kgs}}=Y%@}%QQUL1 z&`!tym;UCL$gRMKv%xbq6+K|!SUtt~rIVfQMm<*csX z4?l!;zP_)cu~{UIvMSg8aob4>akQpP?5y@xn9Ysws~hRjCRB(OPsx#$WnH0y+>;abk%kGky3yu@~6jB zOTCIchkD~8)epsVWO@sfwI%oQ)?NX)@PbG2zA}BMIlK~hJ@mbWTc9QvC7mhoO;m}V zX;niS31$cM6-21^05QW@z!Gyg%##lylv)0Bocqh-cpD#WdT{nN{N~5TLivF~7-Gzf z!%(BWnxTYhL+3S71Np#5Dy{XmIV17R7WpA6Dm@Ow3SgrWBGI})QS=e~XvAOVWa#~j zhLRl+nyD2WbttD(xJ~ZvehvAA^GOdZ-9q1GM#)$U{rD~bNq?=C?JUulLGQP3G?fl9373ck!dy#G_8+wP)@0DLUjTYcoj< z)Cq2*m7mfBZ3|@~&-tnneVTfLOU7Cy`M)$_e9CoFsqfwGIW4iqXKa5@NQ6H~#KFc# zBfr#t_AJ}=x`CMwbBEu+^NN7ohwmh>lx*pIgg3+MN=e88l|Wjm@Rf1|A@!N)Y7)_W zU>7eoJ&D$%m4F>-SD~??3#Bic=lrVK22$68oNpQ9RFJb7*S=%Rb|S>$=kYYwX5@>r zA^~q5$WrS|x+7qzhbL;>Fnq()85JjMwU*pLOzGhg9KKP!vh@pltQ%WMoUYI&@-QjU zN7$9LbynXTCKi6oIOZfz&OprT=!+#EfD>T)NL>Wo#U1>pq(Etyzk5Bp4h?BF zxM|h$MC760$@=FP8O1zKO~bbs^TeVrBM0ZL#lziVVhH zwGHN+`=6#^@$p4c-CTQ}vW}NBM?JC30eogeaP{p$Q<<7foKbB0Y8PpL6K~mH(b{E+*`}5X5iGo*in5j`5oh*}W&Qlsh$8)3UtGz{*3YL%uH)TEwbpSu z0e{qG2HgIDTCMT7;L_zZ%|&kks&fr(n~b0Wt$Qx!%ToXL7^{<+d?z5(SasHixI7#g zi(F}{)4#S--J(mpQzGkx2mf@BSs5czR*y9%Bm{`;h)c}W>=Ifwuy{JsLErFNHx5R*JF$Q5sL+Gq0VpJ%SGfH4MHkJ+~4QL zxUKdI9-4b^>kD-io<^)Lj^p24T%$Uf7M&>28Tui+l8?sE{t`&S@2&`(Q*RDOvHw2r zR#?${GyoO#A|fnh8Qn9z*8WLH`FH6_c6|eocFvC)eq!l$cUA) zyr*{=$ibEwa8BYgtUov!;PRmO`|%LYm)w)h_FiJ0fv?kYv^#2X=+@@QBg^`t$edo% zT=|ear!Dv~X1s>LRLuyTOhKc_5D9YD9Jj3zj5hB4a{dcE5I@bldAuw!S9gPjUheQY zR@#(bGR$bOqq^V8gCFWeEqt%kxw_-x)%_hD)j)JI2+#)^tig~1cI#cD=!VPhm2{zw ztLK&!^uK{M=A{)!k?^MBjT@^}&aTsP4VJ!~zF)RB^u*#{0*M%e->XiD`q;|j^0VlQ zNM{d}hfTi-h$cyp*>ClZrqv%nEt+t{4n9g{{Ux{5+rUdSsv^BL5&n&!AK-K11D~DY zHyxHdxbDk*@$5@>?Vd*1^({Qcj%EyJ)R|#+mN92hl9*(#3&?p9iBv^Id7*?arqPT3 
z9?6Rv(}$xn%4-Jo5F(NDZOeEAJ*mWQP06w?+1-^{1uwr?cC*u$-3gYTXD@qCG$m}& zL*QM8qA&Nv@)%8Fg+ybK-e^gb``)5$;Yq$mi>I6jsrY#(AumsuF<|ObcwYku;4lPG za|8J(!_wS&c;F(g{kjk9*iw31s zRlKhW(?lM+KEK7*IkwpO$Ozh+Nl&fHg_$3J8p4;FvrWUH6$p&dZwAxdE_&GCOU!xj z7nppkH+~b>e&y_jA^;LwVZpcuBBtTs>P1(!M;HrkPZ_-u{Tl~V*aNLJBsGjYw@+%Q zL?}<5I%ZybCn8M+g6f~41%o`4(a!@0{DD>ZRN`Ong2%uV6+vNI_Y_#2HrA-w?@hp4 z?upATcHFTxZ<0gO4LgZ5jX0^gsoPQlHYw$Qsd&E@q3pnJksB?f3C}&{vsRe1MY&S;M})J5?qFJ$sl z%I#HkHE*tqY@&&@KYX_7_(Z#06}thY@}h2EwqvE}BpqfcB&&E0#HDR950Yb#>Br_k zws{&NOvmq?@LDe+p4hF}hjhXwPHs;+pqZuUe}UGUhObv1_AFkF0SB`!ar&tjyFXc2 z%kNS%Xb}#c!>~gHL)t`=kI5HL*9+NyL7t?z;Lp*g7G7c;$5 z!}C1WMX$&Z20OYLOo-RXW52U#!Y;D8oGXtk#xDOoj{V{z;02X9W1PK5-{&c&6^<5X zS$#*Nh`GTc0jI6}Lw*DO+ntFtAVD5pUgzKK{s1ZHbm_tw#nPqvfy+lc$Lkr$({%v(SvJ@+}?_m+z&oa z9qyO)Y1#7j`MhsHzOlund)>W%)e<@ASwq_5f!NawygAUTpvivD`Yv0K2Pmj}Fla-b zkRaLqG=9KN-R8(jjtl&@Z9Q=J+uiN>K5jER;4yF5O;HUF0B^4t9mLT*IB?Y6S>Y!vA5j$J)Y!_M*Z z+R^9nji2(AKQOc!5UKc|b#yPvHz|CnkXJ1U`rQnE)}glSshtkwCi)-HwH^kgE2m3- zsmOS`2d>mzQWeRKVGu7`U@9Ex+mlyT&3C03u4XO1ZsipJ>jmf*z|5GbdOT_jFqt~! 
zav5l!@GVkpCWx7o4s62=nxIf&A^|fx_v%j-B~J8wd8-U9KP*bfk;345t@iL( zqb0Po@%&-)WsR&M_Zc_0k0r@3N19%}d^d;1z>yN4N!0?kq9~8@`4A-;=JA0CD~aGd z5y>hKr*W^}!vWEFdxkvsww?4L)tVW-o(Typ+>CHb!g zZqe+hiIrcTU^#Dvbd3!>`vtJljX=TH4{9E23428f~@I*@_ISgqtD?YCzycEn57R+fOy5)*9HLplluR)cikQ;e>R9F?0p{wsTL3 zLf?>2^)fhZi#JGJ>3BH-lT>6}Ztb!^*%Rtb%nd$2H-3#MOWtLzk5D4lqK(IrYc*g` z?5Fx!rbHMu2P&aEE2SLw5iH5`IDEy6hWD#mPoZakyi%)(eIf9Rk-EyrZCgX9(j_hH zt($=w&B=Uau(4#Y`5#4TAM-YNUr2V>&b-pQg!24)19O)ie_G-Z^Kyri7DzCRcxT55 zbQ-g%`Z=oj774Ghzc(&$818UczUxjJ3fvPV%2@d8BHA2*^1fmJkBl`T^t(kbx9raO z5j>dT-9cnw_AjVpUUqbuUYB9GuKqnyxow-U#Tw`tfYBfBTe0Wt)5q zFS-8*V6p7Sp4nB{AHHtziKdlxhp7{{yHjlPx_R|p9lsVJG1)4li2?eIsF2=`p@TQU z`%vr1pUrZsFZW0 z&qXb!-dL5)Z8!V;9@H*?KrZ3v$JXapkrkjH(NBUAjEV2`rBbKAfy+Y{`m4cIyprkX zRwUzZLY=j&@wGb1czHI;DRx-tjO=_!1i21Nu4|4)1c#T4q84BZnXbficb)#O$8)Hx zBqhQ?j|0u+)eiF`^CdTqyFYe5#F?JM{GRJN!>i@+S_iXVWVKk%Y8 zss2}us+lfKJ1jFDn;a{HO%3$T@m`Z&m0m!?u%j*9ELF-C-ZULR%z8;Y)?pNjoeT_p z*Dl~V{jrX~hFDtQ&L|&Ow>V8iY64W!7~^>7y;HqNwfi2d>I#5ce zQSvharuH-^Orc}9Jztu%07LSx0ZTb+{laoAXzU4OID6)832ikNS-tZF;okQ|kgnzl zYBAA%pvA+^#i%-LIxc30P^h-gVw<7q`*WkOIx%|OTE_E zZrVhLRrb73&xxP1d;60(x>JZ&EXWW482?M)HX{Xp-O^BIDxIQZv!S_vHHKJ0DWyB5 z6C0KPldr%k%koep#MgFw74WOMq_1#JCdrS^fHGRJwUAW|qv7lRNR2YL)ExeHoAiI! 
z{qE_XPBXCIxET|ip1=R{BH71?I z=eQLk-;fur8S5}{Qz)=3w;|$B&5IZ4f>ClzKJI0ZOqb_Z3)_^?PATz}Rfy>hXE1c= z#xzIG{hhf63XSku`}1aiAfjDP6>dVV&Q$+o$-|+BP7#^-1dW=f9*Mh$m?!4>JA|J-piurC_qVL zlG1}z!DJLy18FcX`;a zTpx6+iC)mN->uiKB3n)g8+X@;ZtekAkA8uOUvjY>Gz5A3wvy_y_by zv{|++_yx%5;j*H!87GghI`lRgy(zpk@5EDC3>V<}btfvB^^4nXQ7BnmFZQI?y z(&yso)r`SCx!2VeyO<)5P6t`0Ylt_pTxOfjdqw3cy=G5(S=_QLO5iO!WT{-a!aS2c>E3BD{W& z1q(%Lh5TYT0)aF?Ck31e&CmgDg~_=;DMK$K18_0Q1k~>L=*Frf14)oasjw=&b>FOlW;d=Cn{!e z^QU|JL|Ifm^Ri23TTRr(a(s)@cl3BW4|dw6EGq7Ua*7%gy{PX-)^hk{c%xCCG0o>x z%47Ezz=zKzer8U8=A{W~u2zuSRg->&E;QYMRuZZ~+Lg$P<5e_;G!+UKmY(R$Jo1ok zrijgHc#lhuvk3z6KY7I<%qK3g7dQVbmV*5GocmWI-o6^obE1%KD+xq7riTQ0r2TFL z`*%++b{DQBwCthI(M*A*X>rt-vW(?<@SNjqITW$Tb0C6nSoM;0MiL}OLb6|Y4-+ux zKH7FzRXram?GmW*sYbyP%}y^1L?v3Tlv_R+Tmb0C42wvDd?)K5U!_~ld7{SbM9;9V z3RiP{#DXs?*5%(8g}&NY9;SlH)P&=;djTRNafYLK-Vd-Q=aJY4D56Q__3ZvfhRp)7RFd0X3ZihoKZa{r(guEhFv!8zgNB9Xi;dja|KNS7$Be((B&h&j>L zWV5La$X7B@PBz$39(<-oU1kxeH;py&_pZk4yeQJUUI0QOJWbW$i>Y>X&@4XgH10ww zIhGh)f)$?f=Ix)PUrOyQQj;UlQxm&w%tw2V^;#cUpH!pQrOqOI5@%nEoa|?-t;r+Y zwm&KcL_&~@2Co{;xi~IsGB1*0r|YO2R$&4e0T9&+%I6Mm_BxP5{_Ct3JG3-yMeZ|L zg-eQS!4b~UTaV3O`%_>i&zn5QXkIlGY1!1{j03VKwA4O&9#iyDTwZc;0i?#iq()P= z{X%zInFSLojbn-Wvh$l&TUw;?R#D7mA?mT-2j$2jTH+K%^4YMxaR?)4>m@0Z{d~i) zx4Jq9@#q@~#Hc?YJR<>CsG`m$>uUfD9C(VH+&h8hmoVe6MCBiKs$jMn(=NcQA&haw z53jGA>@B4Yu1ZB@DixBEv>^MSo1L|&(Iu}{a{{h;cU!?p8x=1(rLOYn_S-SyUMB{< zk~dQ0^vBq~xUU#!0&W38?Ny)kgDvvDqWF$66!k`3U0niP&eFbargkw80PNeQ5zPLR zX|krCik}SD3fk%iK$QV*5jzL2;|vo3cYHozZ?8r_u$VBXt#3Eh2&pU7Pa&UhOgZVH z$3%!3=)NaOkn(Zrco<5F;iO3125} z#jw>UWk^C_{xBDB*iag_!U7qRj$zCI43J@636J54$0e}${-=8QKLG?Kl7872fVZFD z`lhY7VN#J5pgR$V-CDX-8mA_wGnZqyboxJagjdqU)T)TPzDRcY!h4q$!uZPlN#_}B z_w@B|y;rTU(2w|BoKwzOe}hG!-)XNOo8)8JXWZNl`-s3GF__|y+UwtHMIPYpo#r~=_@CTV+u%zyS<{0H@wJ9oP^S_Quk%{AD46PVt_i! 
z$0OLx(i=$}hl6ZU@Um$p$rfLMO$%^ZliE{annCmiZkHF#_}P6+uep5P`Q7;l^moT^ zW?QnN>4XPSL6!+ziTotsX`600t4^4*3J1@x^h6cTOwS!Mb00GhC|&3*xtm~ACv1g0 z4as%gNCE%DoWvZ7CK+FQk>}v?#-r&)Yd-?C_dfV-x*QjOY+Ar)t`t#DZP%|Fcg*TS z%EYG5>FFdUA|BiU@JsXv@boC|zv7deTvrxR|pUj13^0``g`x#a@Hpc!1QT{l~m9VL#2@JReUN za{eG$P4C1BA;Gfegkac&cWJ#(5D=K2Z2Odb1^1|MYh0fAECIG(d~kHuHv+9HWCweOl4E!5n&5!AXnfo1-om2=JM^w> zfBuah>VzadINuX2=v6?(hQ8Kl&`}*Q-kKZMT`<2hl{|*A2<>=-riB5HWTu37I3!{} zEiNu*4B>{$zk^^%5WhO4suZ+lW$%`o*Lw?G;8It4n1%-zpp<`mfH7L`=|UE9e|>G( zUE0LNM=!7&Z!^@jxBRSjj_IoxMVIsF7lElfswP2$1#LnQWu&q}L+Ky7zctbi(Ckc&IL2Fs+nCZH06>=K`4_*61%+(q zW#L30CBEb4?H7&MKIIhPSB<$}&_Gr($MVDXr# zn6ZZIeF~;m^FJx`*xU0EIiF5EM0bzq(gJLz-&XCyLobkQWhcn-^3lcwYSe`)TO1QB zo{290z&ZI3VWI%2gDicUM|)&|E%}Y!?P86Byr)&V( z+v?6hT{MYvrFR{vQ}8;WAEg7P->y`K`}8{p`)A=(Vgv&qJF*k$eZaYBmZv7r`(R+^ zSfRW|B6Yy(*X1qQ?~!@_Y;LrVdn&Xi<^2;7=L^-sgq9qxiad!!+f`jwCJ%+FhH?H~ z%LT23AGDsdw{WJDy`2Pq)N*K&;*cpBaPsK&0Kg1${V}yg= z88-`>5-g=B0u~8-{%c#(SamJ(Q&b%FiXI7PrML(8Rn7c%!rzVTI=ekO5GOTDO5RJ` zu4=qFHbN)!KME=w3xqB#e}}_El`y8A|B23J-w1YB4}1zy4_z~@{$8aE2B8K4 zxwXJ>;0Uu9;p9i2I{|kX)8kec-!?|A9At1!e8NP~@dHqf1SfOm;>ag&KDMS3E-y@j zOz?@nKZDfqaS`i3I+j$0Z1L{_iy?b(>K*e2>QOUKzN$c$B&;3Uh>j1ct zv?$SER+#!x+^gFGNqd$I{PKB^@irwB+?6Y_DSw1|*!S-#gsmg%;%7f(ap&uG(u`PP zI-h9p$>LMinkPuqdr07aI_Dk|~Z$xU3`5!1o(mpCgN?j`> z*x})$@b(XX|NTYM*=#LL{QM=S)O0vQM^op&Ye^k|-7}K@+#_0`TV>m?T-wX@Hcv4m zF}sPM#BwciYd5(}X`*gwuoVhwtsi|-{ew}XVSer0IbqlH)hv6(S?3g=QNwt<=!5?Q z!kE$BxnFP0*txfL=JTfgHfF0dKm^~I?^KXy=Cw0}@Q}wTm6q2c}bQh}`@JT0ucw zGE>f9DBOX4({^t>ta}}2p^E|!*IUm?7^U(B@Q^2hoJF%q96PnQ^Q9l{TiZ73(y2RE zaNUn5MzG0SU0einz^1LU%aue|oMt@zqW~e|IX`)tZVSvNNio$E7sdZIY3OY#&|=_g zI!$`V#d#}rmdt<2!e{`Z#1~4*E8P{!?5t`M&Xj~qh3p7qE+qY&=-Q@y1EcX1m=-B6 zZcrS*?I4MbCLACnFiT4SXbhsl$h@Xbi?#fY{+0fp?`r^Yq#ripzk0aIhFk}}0FQP^ zEsWM$WGulK7}xMKeyeDdf>W?X#Ng}3&BO$#X;8=5%YflHdl4rhKjZn7fGX$M?#9#k zbP?1vUB9x6ll&5qf*+*Yf%W!{0AVoV95IYz zX0A~9^^>?z+Av-0@etp><+tBo7%cSZ<{+J6w<{k={6cwgD9Qv*#`GK(p}Cxpaa~P? 
zf_$?swijjM9D6S98ki6_?Lml$=#M+*v-x)m=X+>@A=SOq+qzXdpDWcOsmrPeJ4^gl ziX+Ugq+=|cQ*%m3GMaoj&4oBt{=*{MFFK1No_Geq-QxdJ&0tMEz~uhtoEG#0Kvr?R z>8g&Co!OK$b*cA!3azf#x^MrJok8(8fF6l9W3{QkKGsyKe7ls_uLl0ZW~)&I zl#dTQ(!2*iT`}N!idhvYGsuM_={@E8E>6I&eXJk?PG}_HKQM-$UwcqwhTuNQkBZmb z!rL@N?~qJ7=NpHLxDVlJIyWOk=^Bql9|aSD-s5lf<3RSOqT+dkyP8Z?*!$8m0vt1? zI;UeeH#C#TPsYwi=2+7z_dayh1`_*zY`UHmA=H*qd>n*!c+!mcyZ*?(v|h^PD#eTQ<{ zCc9sVee1EhGW8k*w0pAPa+hX1e~HJ>BxQ~0Y?K7oQw&_@W(`?9XX4z5P2a&&(4&k$ z`6%kQ@B{Uj~SNoO-aY= znlgGmPmT+)utY`kYmF@cTb8D@xOo=GVuE^-IcP@==x(Xp(VJ-XD*14`P_EZb+13>* zH2YPCyF1ef0*hV2g^AcYLrgE(KJq@BEAS$ovs;u23&b#dZAhvLl5PWZI{f932RH zn?mnmj0xGkA!B)7A8Z-q2?e=3pxS5}py&d~+K}>g(;8~j(?Og|x@$B|s6X%rKXT#* zG8AifJW;fztjzO9t?Au!J@d~;s0_yh0gxKz|H;C?=dbr;d+T$)WXj>wC&qfHy$la5{IM4w_JruZ`u&-XVRZs9KBN1zV`ZM977X6DGidE z?-@*f^_DAheO-&IU>4^^S6BlICjl(Te*px6!eQAzGc3oA@;G42j}{bRhbj^$Z^CvW z2$>($dB0n~EnrKen}2?FNXu5Tn2qxpvB9oKkM8V%9KkZP{{c8Ca*bQBP-&D1BIw$O z^C8a{s30fj*VVq>=mNPBXIYw#vL)j97p|*0DwU`eeoGhGpEdK+Klbbz(e0NGSQRG5PvU6 z1fFo@xdn({nH5W5Z*B(ekkOOLYH_*P4LM%y{)qlZLYTqLKV4I>-3}JP{!T;C{tv{> zeJhCPu2+NG)-#wDLs+|ur#@+q6`22BEad#jqz>ZU30LQmnleuW0Ji2aSj^Jzu0=$;q5L?Jsb+T_@YCfEIOLelM_y90a#%zh+>a+In1$_W{btWYgC98I(QEx2bEUA-2GqB)*eX7;dCVNM4L%+_WuX@JMQDaT}5_q z2M>3J)Dn=+`R`l+rn*s)Z)Y=|`5Vo8zlhnb)^C%sK-jen37BWx{D#X^F-^H`96s(* z38GCJ_K}6yshgsB)!vP=k;X_zg?L z7(*eJeI!t{_@8vO@;a5*1tm}Y@pS5@dTQiU)FM!yCB+%#)m?%wUbpx5_b%zGR<}rD zXi0ALFNCTII@@whyMUa;>3Hg+fZOh?`d|(KW^rAdUk>-{##e`%f~R-EcH`+$cBC;x zE%+iKqe@}R?y4gL3>hM5IYnjKlNY+z>lPfi>(Fb{O1*EXwWU1ca=&2=pByqBk5x)* zh8GSTVt+X9@oEpS^M2m{fx84W%+2ca9dP?&whW{bZ z`ifa_f4K|WPiz~P9eBw+n`mU^dC-VR@mj01`;EM0pVQrO zr^=qK_r4ePl11N-2SZlyGqV+1j^7L4^hZ(QU^|CiGr4Rxp_g)Z=^8&0Q4obN^Y^VS z5c70=AME-zoG>S9C8ocb(Y>@5sJrPJK)UNcIq`lteZ|5>g_r|>VG#AmX{vi^a=jV- zO_0=!IIk{cUWLOa|M!{ig%O5fl`cbe0T9(bZhj(p1{lfzi7IF)1(u%8*Rcx?qF;P7 zB;}HVHy4=l`<6r{&6;a`0p{2A4Y{GFSD+L+ly;P_pyxbzeI{9T(Mxl6aXSY=_q}sp z2g-3BEjRD$6~KE+tzV8u|Lj6;{cDj|!FItf8HjXYNX4Yc14uTryHzcJ3=1=#pXb3v 
zg2Nkfk&$9HvY%F5dK{_v82XY;aj*E;LYB)j+}l5!doso0P=s~U6|ajPH-ji?I7mhr zNNyKfflRD|y1KBM`sCKbq*{wE!Kh9MQUs&h=@tca?yugh%Oa z2&3UwI{i(Ff+V~rsVnsgUxYm!hZ7>(^eJlAyeiiq89hrPSyA^p!VQ-kOSy23k{F*d zPIs)iPMO-0QL9p);JfkNr7R*5SGa>#fsAL<&!=oX^`;jC0cY%CJz0NribWbP_;aLA z1kTKb+nv99&6eb`UGwMg59$`yUy8`K%ppl;;coS2wHDuGV{=kLu^!#}Ce>K8g(4HW70v)y?rJ^^uM8 zyu|yrSkWH1k!LomIXVa=;O-@eTy1+Xg2|e^gcnzTEbIE@=k5w%mmMN>3Cw_@)%Yr~ zUi}htH|a0)3ZD8tym`hV`#F0L6IIxdZW))0o2mxIyq-;v^#VNA#6hhJD>hSU3{Llq zm)RPj+eKOUS}_Ho+t`e=bajOPMF<319vG=SeRmbR!Ob-GBMvP3yIGZP;o!uKs@hIV z0@CJ@!<#u_%}^)B)cBieSJ0^?5pnYDQn@^WYw9Ns*le-i6ukvO^<6_w44TEz`uD!A zr}aMfgiUv|_X?#g=XS`PC~tA3Qt0-CK5seuXtFJT>q(}mMuT&{g84=JG`kRbw3?>t zV)hAp+DiL|&AyB6L27u4m3ciR+-j>~GN?kJPE8M??Oc-T#0ui%24Z}<>OyZJ2%FWR zuKf(w|FF>cPCUW$y`k_s)thiKVy$QE{8Wu|V;X_{H( z((PzU5cu%~WjrXSI3T6xvZXh(gu2 zLDjdF|6;8E2TJVA67M6Z@lk^CGHk}K(UfY;D);Y>tv^LK78I8Fb@_0t)N4-y zu_LS$xFMB_XUEQaHl{*uh-ELLUE5D2vM>E&eJ}UP;`#{!@Cl(xZe54>`O&ymMlu3(5&01Tg0=O&@dB@>A5`zs+?dkNoaq~4As7BUsNpQL9 zvh=-`xf0jG`4RgZOp(X=v665!YvkpHLGW9afBE{?+t0+#NC`mQ&wIjnKp?ev!Nn~T zO%+EqzByh$ynO!Vs1N@YJ(RG~<`D@S@{z08Tg^o^YjliMZuzKKh``*&us6~+yU134 zTst>_e^E&yQSYx=2@*A^X1zUB?OD_U7qY2Z*ZR87C@#;!gs_Y+C}b6DU} zVpokEXyXarSFX0~78^f|0lpc6;-_3y*-lcu>@bK8SQKF&TRkvbwv`NovzkSRf`X}J5 zHJOEJA|cf*pBUkalQyW9`?on@V_iio?H=?dTRsJ`(MpF7(lH`}u@Rcv4*e-odZKoI@C zv;rFE+w;<+3|ZWu?zFHSU~zH%PRmAoXQ^|J5h=Pe(hjBk$qxOaV17sb_x6mr^W<7e zX7I(s0zvq-d1(U4+`uv4w!*0ZVZg(EOQl{OxryiqW%N9C_Q+Pg>>2Yy;8nnW{vA8` z(3RxL)&BLZ-~*J?F79RAh?Jel#t+qZndHxY^3YJ_)y8`)v$u>qNb*PTE=M;MU8Xji zuiqyhbfh`_?~psmKoEk}CM9KfUQA3@T*q(jrZD5hU{miBkTz1UV_&k}O`)cD%p%0~vb#O3gq5{9dAN|A2AS;7@&wZ(!~L_)bnc^+NfGDhulFVvDo??_Vl}z7ccc%# zh7{f+X71`m7+2!Qop$KQ_ec2dA364Fg9`6+@%~@b1Hp1>&b9rXTi+H5tl!+~?Ll#) zIH?yU=NiAwH1yn8kIj<^HH&tS*(sl)TS%h7rb7*J`dyWXg;4yfi_OJOBCRXN77vWe z#kKEE7_E9=99yDj7t6T>+hwfsbEt<{Qs|iFQTVvsA7V7F_Pm71Rk*OfBu0+Jbw54r z|sJy7bVN)YO05FZOQV)wpODP=cy}1OL_Ec!`$g0i+&y z%@#|GW6Vo1F;Ms29-ObNVxX^m+p7+?dmj|~XI16I?+x=K2|a&^t(W9Q z09*pBqSpiU73wNTs(!M6xCok 
z82_Z8G5Igv{k&&6d)?JA@)v{2iM+P$P2%gf(jge#vb2{rQ z{0Zf+o1PGQB#_Mh?s6#0H5mOMV=18kSy*3! zT*PzJbvlJOG)peT9otFVOdZ~;eqixM+x^Zzj?YXFnkFoJV`G%)YqzhC!0AW8J-Rp5?6H1UO%f=GWRFO?2qk!hk35FgM&e0p@VsfTjsr0BM$u< zfkv^tOqZW8)7*- zB?nZ=8}r`Zy^uPWM~YQbGWMrzRxWb${}v5*UDb^$4l(*?%~n3Ht7wnM!h;t@F`hZ| zS?acJ%Dr~~Oe3$vL+~7D&PDF$Z}7@KD>`J8O)jx$2gQocJjp`^2RE^)3X{{#JDT#X zrka~@1@4RR`hy%UT8tQ1k<%2KlbHd8Bmj zE$9uaVs+*}Ff|`tP+${a7f+XGQ~U5~+<8e?-m}FEqv=m}J?JV`u=k-6)=jaq`gEGG zGI3w{KITWdROq=fRA!*7U4tZg+vymU87kj|3ayhtq`zb^-8_`8p5Ihs)eo0U;u#`3 z=dnd6rxS-g^Qr_d2zm=F&|goM~Pg=LNnn_xXF?{rr$UO5!4^Tu`FK?muf@E-*@(^2HT z*Q@wJxLzG;7(YSs*Tfvb!81MkSmL;C(bNKfLPQ4(3ow9100P}v2Ov44Zk+FX zci*w%st&tsmD(C3&5wqT`n?rd6K1ZtwTr4qqpD!$2fy%qr^|om7~XwunZ(EKpLe#r zX2zv@&gUQeX?*9>cl}B>j)7%DY0o>IHQQb37<{n`>uF(1>N(A%)cn|;Q0(| z_W81(saLF1lfQV*N2QLmJt#Mk7k`$qrKH>&Vq+k1GQG&po=IetsILJ$1PbeUw1dOx zNIoYYl8}=82SvRBg$JaMh5F(WgNC?iq$A6MAKnk%XedvASm#J7SK^bvBhc^cq(A=C z)ooSRus0GWF~TjVzK5PnqT9(Y4nYf`z%1YM32Lr?iolPG1S*=mD*apSb$ zv!KXmx0=(e!M^8t66OPtE4-U|5nlG}CCe=fJ~a2qHAARcNQl7QO072=_LONPh`CuN zh`rrC%(Ru9_M2&TUoeebxD<7*vRF4=`G)+-{hbNgAJ}6X;rGQ}!2-I0s!L#T7#32{ zxugNd^Q(Iq#fHZK{duY@EWV5%QtmO+KXn&>906a}|5!-?dM0LdeT@Rxai42t|GDZN zaP_y}d~DR+&?E;?&9+Cqy#$jrkdK9Ht@WPRZ8V#~$6!bafLzXBBdlnxx^q$fESDuJ z6|MY)n-0s)VyeMY+7z?1dtA_j#)=xAI=>V4TW;1_m{{l%@8$T(A9QflRY2S%Yw+;(ha32XYyF5CUln;j1^qlDB~c$YKR+S_I6ZyzMIi z3bUUl^A6ISU1|q`q6e;;C_0NgxjZxilsYN2Mp2%hTRMW_K1?KWEgPo64eis3NA;+5 zOaBt`92c{=O{N#N*@wikZ@D%~T~zkGrJu<=_UeQR6-kC3N~>u*x}$%wj91_mzjJUD z9h;NX@p1KWjv0lFCP!C<@99VmDp;+biYUCh79TZSRb?AheHZX3A_ye_b>EqXf>Q#w z=zY~A;%H#UyIvdrxt%sVgY35)2IL_2wc}L-8P(#JTw^zX2t+LsR9^w^(-N{xUF85< zz|&nWNpFMR+KntOBt`mBQxunO8$Ldd@BxKESAj@n^pEdI`Ol-l2I_ARt_L~2H9Jpw zu6Hz8r8|pdrV*G`nw4 ziCdyoJW9#f8lU>MQ{>qs2C(?HcEBW9j_jo0I|kmU^Cu22(93t#;T|sLi_wF+!4#H? 
zr~mHNjUHdd^MSauT!y4?r~@yH%ohRFBha(^1AN8Q>bS*o_4l_dK`*UG78jdOZ2_9D zGK9a9wU`dFN+xXxNjsrjPERwX8Q1p=V_>LnoxywOkStx9A49(=bZtgIs!?~ZCTWvd z3{x2HLz@KI!8K8SNgD`R_BYV01X=c*r2_F#nA7{V0jfT4u2!$lJM`3;p#1XT3+7jh#picrMg;G?l$B_w231qxC}R{_48X5g|&m{>qc+49dJ_ z4T2cB`ezfRo@c~usps2&MPwGu6#M-y&IC~GFTL>GZev%O`#c_RZF7t*{hqKN2YD@r zYlK(EM>#+P&`IezOA}5#l2uO^O1}4_*WBq|L^keBrq&|Y^J!Xy@>|N2rBm6(aw$Zv zN%6xMHt5%P509kXUEitY-S6Ieqo=0;5g<1meC&+m_z4gmMtiKm)}qR1?Q-95gWLzC z#&9}p8-y>jZi8MA?7rdd^`)hJfk5E_wsq><50pSlA4Jn}ySdwVyV}OQg1y1jz^JP+ z3{~@kGlMST@Up?JZ$E(3t+??CZ_Y8-sei)lN}n#JG3oxagY{ua+$Jh?9T`i`6}8cqOu`RsImuc+zSiYF77Hzr%DGrAy- zqc4S->m5?#t1!@(HBf*U|6kRyL0YY9PR#Vqo%TT93=+G5CwWhc0^HY!&uF(4t5QoI z`?HK3?nG~*d_!LYrXr-Gx1g(mp&G;ISK*(s2~RnIc^yw$B(s~iH=YTI|3R_<^MLSY zc)NQCYUOXKzr^~Wnl#`1A*L~b?|SK2q^?M$dk9G7FFc+c#jkvLv>o)qxAL`JAd}%Q zxS>Q8X!r4Q3N|=ngX5?912A5h8ug(Ja8Zv&93_P{2t+gh{u5*~%sxK-PCJ|wAi}7v z%>@E0^rLkw0#)&7yC{dWKIyHuk*GiV6cserRHdeC{_AI@f+VkF5!o6mk#Qm6aXEdF zm3i|fGk%#;@aTM@D=69Lb25@;JUh4jUG(OktKD`-YQjCf08YAD9dnZWr0|(+m#2~F z=ZD3K0uE3o9r-6`qc$`UaJ%Q+=oGm=_^N@Ic}0yd45d_(`23tF zseW1Z){HcljPjOf<66pTO`H%M)67F4cL!u4c)IVJ$CQJA7YkUjG!OVr6yT@(U>5Ff zx8Ua|9=+a{UaH)J4lpP+$G&9Qlu{iCF%pm8Utg+$ zhrk*wL{~P?Ap4E?e`69=!#)|qo3t{|Mptx28MlH>Fv^7J^xZ4Q!}AaoOIddF?meMH zWfk&9)-Tq(bXbVwe}5umZCQVVKtjD?Co?zhb2eIqc`^5d{sjOafeZk+`P~$1*ttMk zrKV?srsCE3u}}h~$`1cV7*DZ*l`m5Wli=c9!KSwU*i$K^0o|33?N|5r*&h$otoJ5> z6)qaFhv!!}VyA89uoS%LVm|Q8_9x;k{}<%mzEO9h$)w8K+g^Xq@YK_Oq`>R@f3$Q3 zTE-1?!L2LF$sK$f&|94{m7X^~lkqgWLqW{hdp>`Mr{}%+E0KHNm>}HRe0#n$1T`dF$p%#TE-~> zyRtIoCX$88`8XsAiruySG^()Jm?k@u=QCKaO+5=i308sls!{kz_?n*D4K`N?2j))w z;J$X=_Auc=P`+y2GYWz;?zdK~qMzK`s4?Gqxerz2-}7!FMXNq|TO6Y=tR&004T7BB zOa7W82^5RTOkZjGsC>QWA#cv~@9~TO_xM5H#0u#j{@r2XQ)A}eLF%o**aNpIpa;8M z@9Vk#N736A)agEzJ3QT9b-rV62QT9grft4Cqza}aDLyZPYR7FKQ6pQHhMriAE1EPv zFBK-fE0w()t$MYZ+pZiJ*pvYsl)Z(4?fj%CT{(PagY(_0;XrHW_<7c)=4*Qnw$U^; z6zBF?A*Gr7u@VDZv13xH*>Urp=DnN(mIiBwZx|z<^&hli;%T2l9W1qV3ZkuTqf<=#^&IPh9+1OMm=;L@E1S zv`HA<3-{Cjnpx?xmXOZ&;8f<_Fx9Jkmdh81ziFS6aZr~8j|ju-I)-K{r86LLaBQH^ 
z@$kmgvSny;u0S8Yl|ShdWpB&G?KYoLs7FYNV+wpCqEvaNF>?RXU;3VdiAXB?`84Ls z0j%Fc5*EpV%bQK9T?GaK0vy;kKsB7~A9MAjVD7UNiXdYNQwRz>wvh)97TFVLC9-X= zGrU6F0;LfO0O`M`&(<8i1c(lFwCBA-6Kw|lQ_O)f)C;9{+#johX%|j=JR^2CAC_ff z=MudR)rAj@q*Gnj#O{@1Owb-I;JO!<%bfWToQRuubN( zz?`62?oA}c*|7g|r+?KK<9Ujm4%&o@`v`Nf|KkGKf2)=nRzvhQ?4^pYRWSO~Ev)vu z-?v`0WY;O$vCh>$dJctdq-mxfw1mMfJV^c!-lid>}rpPL7CKRNL`M#D2Zdu%jK5NTM%%ep5PY$76ZrDzm;hWJ0VO zvouY99qaX6)yu2t-eQmt?9QuC`z+^Fi^DurWmuvb6m5SnN(m}86eB}@j-In|ZJEUu z6t8c7o1f~`#V;pfP1aKLy-GGNppS{X{X;5nd@=jyAi0ovipg7}!1_D}60Rrg87io` z31BCZn)Y$swWOX;0EOwLeHj&;l0(Zdjz=s2{~vRj1Zvvs6}xnvqMqcrJun?~;8jym zDWaItbilbHgC1&`;wBmlqskWiQ>z4~=MWpY0>a#)FN`F9baEpk#2d=bvSN-Mg(j0l zLv_J{y;99rY}xaE+|*+~znlEl#VPxFhonn3rGIGqvC5xzPV@5%$#9CQY1}U(LNsi5 z{)O9M-fM*4eAA2b(n|iAled$x^JZ}v*tdRv=CWii+U&TC-&%_W`S-&gY-ZHZ%j&L+wPs{W7o z6{6O(#yVOZeIg z#DscF8bei`$>_Nkh8E<1o2#{%a)tc-3}flZRUarYcVu$fxH`0Iwrxe-vXx@Lw^8c0 zT4X#v!rxaLaC_Xph{6rQABlSett9|)q!paZ0}6<+hv!!=E!E_7Cs7geUZC#Sh|s4+ zUP_1wh*vXzUI4{J?*F0#M|wtDoYVeip&d?69L>~K?Cr~vQ-l-C$FiVrh@HLWi3Ydb z-&>&YZkTEeAue5A$OODE}s`U}wDbhy{V6H|0 zQNiGI1;rFwA;7)-)n{qW-h9f;Cd`Iv9Qz^3Nmp+ymv5vqQk%8%R<6jV;wbBI#K>u1 zbs&KrDg55FaY9Q#i*L$B8kuSYcl0~>fXT=@*$b=^B_K1T_2sG-I9|_j)@o5OKwl}p z*WVMRgEbVp#Gs|_C{D90c!j8?(8E{s_@dg98_>PJo=8dB7Ah;l+K|k9s^?3$p>u6S z;>({>_i(y{Qqpu<0@L5`c0CEJ4Y>sp0lZ}5|8Dd4v_&o5>AUXrPmP=5fE4mNB9yzx zM-*YLfCV_=NAV8|oP`a`I}f)@fhjX#H#6h0$EYI_rK-m9X(5 z-IS*9u4+0B)dP#(7UpCwZ25G9?*ewC%$LQ|F_`cV~xplZ&4-(&=pm6q~eCA@k^u|)1bQq_SJ zp5%|X>u|4g9Mdjt(xwy4`E4;%6aG=VT_y05JgdN3nK8A!E#AU^(ZLvFqAAbkCM+9( zDE0IlaSMGJheQZd&efQBJqrE;Ihl8l}$O$j_JwSFH)+H_x-p8 zBeaE^9;mWcnXdmd`Xk@T`%zL=44rq$-dD|czXfw7?b!7yEY!!QKwY}DfZJyZc?)DT zQ?#`}tNi?jvdXWDA|1wN)>3ZOfEUqB`J7@5g?B@+~-dH(GEcQHNM;2g_QjPowh88wZQpxODE8h1$p z#x~yhTgoiHjrwe?{(c|4PU_Wac^UWk^>3sgS|Tu;-Rw-_bWT+(3S1%6km=BR?@{l_J^yd>>>v`q9 z?`YT4eo2JU{j59O2$V?Vrp7Wd(8Da|wM1dID1IHhHA!sF9J$Y9JFIrZa|z{cvO*$n z2Ro)pXHk7tSW}I48S20K!XQ({=2rE@XcxVPZ43|^Yqa6LGg#Wztf}`D^qoOXyVXBD 
zFu*Z6*^@c{!h|JZJxE`#feyB_Pu&O9TQ<^;!g#c(Y{>@Po3z|tywzmHfvRR&JIh;1|K8Z#7|ME19=_`AHo1+cX% z33Pn>1*;o{er`8--p}aW$YeZNF^6~TExIz5Mntcws3~JYzX00n@y{5XiB(Po!A1TLa zJI9xc@6~ZE+0_U{LPi^pmPi&IYfaU0s2YvDle7wexzWBJlk zl6*176<3neo0smW&%R~*b>b@CYWzx778+h1>YEcki!7x>T^c;r3^UaD?+c*(b1y%L zw?yqG{h4XG*>i&QS*nG<-pkBSS*hbxDLNHoS$F}5HVKDP?4%mVu17zT@#hvdqjuZR zuvrgr_K;?RdiF{heKcG3)ZhGY|B6Zh9aLA*eAQcK)fse>g=qpo4ZO71%TXev$O;gL~00#k(u; zI>?EX%iuWyNG&ebQ3)k-z&Lem)h>_4;Z!p(n}p}5PMl{1K%guJV;>Atq_;_6F15|K z=h538l(!Ehde1Vl40Ah8Cq+&t%n1=pv%}lhyUh8tB@?!g2mH#<6YOCZ(Ud|#T`>ID z0_sHnL)eQ}zjM_Jr5A5CDnoPo#O*$i{jIpAk?XDcT%)%^fKMQ96w;^Q1Wv(o93`XK zgAL2w_T=693j5PuPBGKFm)e3Iqb4W;Y3YRjHfr8{JE@p*t%I#J&c;L1aa#qyBztTl zh0DVAAn^e<$3`%I_i1x^&@Lk$;`MqWlaWtDTOwBM3+;b%%vv9dnMcl~*)KXuODnan zX2lBvgns6GOIDO_d$0$5+{QtZ3UU5~AZJQru0N1YD&{VhKJ2T~t~PSb2?zQ#^x~p> z9-sj$U^fZ$?XB#<6$8ccbEkbDWKEF|x_K&RMI=ZL?t<_s$-RXl`m7T>WEvfd6^TT+ z*wtg5>F)5AXP7?u{Pg`er^lFGa6w~YvBwg8(LeM{ctCt$OkOoS!mc#*LV_W?4c20> zp%FXhpAy`37v(1D6s+z!L#<3FiBt=c*&Q6=S0=kViJg|0q?_6CW2k~07LtijEa`S^ zNexR~e|71D_|cg|4ZHYCfkBKvWO8q@);rC)69?`-aU%z9YU=5U{=!5=J@1eW?|N)< zIyD;kbw*o@>xhO3{e)6WPj67yZjCvTxCH&V<3QN#w|OB(N){C6pflzZBb3Ec8T#as zI^f&({`RZsjW;e(aj9qk0v&XS$^&4y35&tXj+pKFvrJv{57f(Zfi5D+t7BY>Zu0a3 zF^87s&cQVwId-sLW+jM@JOzF>r+5Y{lb$#}qO{Sr=BHBCtgKXw-8=U{xcX=gJIV4h z52mFrp4Ip**q8tHuj$`W<9NHT6zHtlX0>2^mHFb+0*h}w!{8{bF*V)^;+lHlJ9~;< z>W$9}oG;a}{U+I{7LqY8QX>5*xMZy8OPX76N*spv>m8Eq^_IKjAcKb~Nmo@LD{UTh zQf`MjY|0z?aPo`us;AOPZ_L#q%_+A8~&3z!{J2llmc*^#<0xP`C{A4OH__g z1bXu~H|LaJUIWd6h(fC#wbLx3@Na=pvhlkcpQ!=u&LsKJ%GvQu{7B$>UjCuPc2Phe z9QO@3RUiDUs2{r(vrP`{hPAb1<#-tP)f%<;9~%!L4Z$8R--vJ2L{56Yg>AiuNbe{e2d2f2RE14v|Y-2>N#fx`G5p!h!+1uh_p76P~gg5f;E z{h@TXKo$s~3l8WR|HZxSoz_X=N7}fSfzD}KA9yA*YAHfOogdlMFx z5|NxKiw*=R?8Pj1-cz6>$G^wd(gt|hkQ2UwvX^=U2onPLSO>j}`@V4_-Gg}O@vQ$ZIllX-(^+oLq0-91Hc@GGQwcW0 zA8|$o5@XWSTPQHn&CT;Wm=e@{qk<*$)sF(-zIzZw3;OMf4J2sua4OHl!e z%8tPSKv{+-*>-B1d{X8r`AN0IJqsMDUEKfFw+ZE@ih+6GMR$%?xzVjR*gGwVE@jO> zqu!DpJGzMCpGt^3Phb&Bt))#P$oWk*ToFZ^Yen3`I?vqk1>&?fO=c-L{H&=Cg}j)) 
zioh5%E}VNz|CS@Xnu~QAt8~})eweikn+r7+j^R5QElS20<2RFy;S1LT{=}fHjHN;# ziAj8MuBfL6Co_#8Vkif#F8wzZYJUs#5@@v2@$&a76ZJ#N1;&2`{N|np+@@F|CHb4G zjW^~>x^C39$og_y^PS!O=e?onYSl6%YPU>y(JBh&`LOAV(GSc$ZNeL5 zc042%la+*Y=-g^?~9HjzoA(MKiJO=Zv z8rmjYhwTgBz*f5TzYN=2V)Dc)Oy^R%8Q=m?CAf@Z-rH3G6w{%4W@!xJFUh-zkL8Q9SDv zD2pwvz)M(H4=bfETojV&CrBcLbc&$13UwzOcx2B*K z4dJ*W%*g+XSUP6eX3SW;J^$=6kyBMu9T(Bm{x{kb=w~xrY6O&19{M9q@)r~J7loVv znkIikfA#T%9M56sJL#6rOejy*hSsLJEfy^(=#$t=`?ms`lC|#{KDiROMVrTbo^uNX zO9LPjqRnD%Ud}wbdm4j3npOV6Cr%W7pn03;jEkf-Uck}tA8@fxw8{WF&YX))#*i*- zlL}8E3hi>ip$?k5bEy7SC05A3c2_pohpUx@EoB#7BTfB|N&SgZu*a%WLBA!t>KPZ- zC>sKYRjIPOZDjZub@SVl5dSdBx>@^9Cn>U1UpoYq%V--sU&}l_=71y{48rKBap#8_ zv-@)Gjq_VTk$?W|@XD~ZHKkmpg?vj9&WPTgA9Beu7|6E=f$WI5co#_BCCL61|0@c{ zXS%0S?!`)lnmyX-+5&|gQdf2;iNnXq4t8lOI}p^9@V=j@I`SXB70ErFchtLJs3g&{ zErqVT^!V;Mh`+wUyL&g7O0O0H@t#udQ0V2w@0EO92}kutjlkEqzmAf;@#sf8Fs1jI zB>gGE+30-qiWr^$x(po$;a(w}$k?u}uEJ>TbZiTZN5}_*jhrZRC3|K)i<o^5j+Fg_5v@Gq=w68Q_>cI6*^p(3rh|8vgPkbnC?eklprRP$r6YYUcrHs@O&p_S0 z_Yh&tr!wZ9;@_P1S&MTg)^ZDd*56Ln!{$m*`CTboMIJd-M8nVN(CX1^=bmLSsq09W z&EV;2$}!Ki@QWj00(Tr<ZY7dh*7g%gR6XZu>rcOIP1lSFXidjlV%iLf zj2dmKPuu?DQ+K~Dh8^8-U}YMOX<0>jg$Fuy{rLfg_+*p2wOrBtZM3;1Q)&JiV~T%C z09;X>$^Pwgps@pM9vy&;EBR4U&jO1pJZ7=u#f!ukd$;?0ilFYZdk9qYo&<|o&Um(h zFuQO4>2yx?W$YJEV5F~qrcUL~LM7{2pkbX(Rh`Ss&aOS;%~~=APw2)lNgEZ+OJLe= z-90;ajXD|ZW;zU6sBO-IeKXi-o+;}$`1J$DH<29s$NsZ(U`@G8xF&PI-6i%q<_UdL#n(scT9(2 zGj?uq&v)opF3eVcZG}7UyxgJ2wDqrdkeYDXC-qN%BKGvFW#gSOe^Nm%aR)0-C%F#TI#Y(c2&q5CofW+_1z22=Il85GV$lF9_6s zudZl%k0e~ZJA#po>6<~*c>#mh0kNo4$oHq+@K@wxrm@SdWVw&GFn)s@<%ONI8gac= zv{R`~+m|ONuQ@0sWbI5KzBwdE{?=+cLf?i>eOjD~0y0%QXrtHrik)Tu?rEC`5y6Gv z>{{i-aRoznh}ylKhx96w^d(o5LFRul5acrc_QsMs;M>xhFE_41piG;Urj{h1FWT%T zGj7q!W}^h4LIU8)4_$!kWte)n(|&@x8U(M?ewrA5@zieGisfCf>4P#=UD*dlUb6im z7i3RQ_NRQW>rJ*i42K@%3iYo#shVgeVt=PWCsUg$wc3QUi#h%jLI)z8(Ca(4-{sn- zpp-^yU+pZLsoRZTJJa!J{Yu96fxcq9x_~2R-b~7%w%= znZB>*vpYs)E=G1(&Bgcv$xJJw0=!tlyq=rNI2G5+kr_$q4YxF_ zCB@YzY;F2PuFG$lML!;Pb?1$DT9&!DJam|&g!;;~Is1}O(hSw~4bDu=tAb{y8(+s~ 
zYtjZ5zVZZx0gW5CHty1$>PRg5FQvXnh-a91VWz0xobk=X+6>T;r2=`eG_RluQ;}E-PN1`hG!v?V0K^vdoHlSO# z;cY*v9}GRS4n2~xW|Fp%0#Bgb-7+$c5jS5WUCA}pd~X?Gzuh66BW5Wd{G}P<^%_8) z0dk{jqPuICqPt`zfu$J;^r0Jqt!uLiYIw0T9j61P%{pMU!-3O?$FkJOO|-I?8{@3um62C!_H*`1Dui(E)d%7Q z?1Qkbz^sVLUW){;9M#swzd54AS#uwA2gAe6enWf{zE>S1THa)}x=<%2>tyX4Z*eQKBCU5x(UoMzLj`^{rKNVPKym(KUTJBjo*stspB%_Wo{@UYOV0656w~%l0y2C1kT- zlhpcfD0>QJhS#7qPPMOF%!+FJOp!i)Tp9_pSfjAiye6j4D+(vEv^jsRxTH5f4OXpv zAXD{pb!bI+=LWI%3ciOOz(m~5Fjs>S)Oa_(<`m& zFsE<*R2QMC5}?sUocr!X)uT<@wryD(9$)RUqhIm!)yP}CQ3dYEE8kxg$z}@Ev8zPc z)^YSmXhM7yd5Ra?lm&A$`5#7Aax-$eDU`kW^W4|PaMgs->%0btSJYnEALT_VSktvjCwt z=uSat>8p%AYZ+oaJyYh^XfW$YT2SV*a~_aIpT(QWwf`uu@|RYC%vdYj$t~G!A_b-Q zmC&1oi%VLMPvyOuz8PCtySlF1LM7V6T5hg0_)6k-=&M4MT@_+)LHPZGm_X$y^iLWr z^^cu)JfqcaTvwo4LieAANmyNO$}b6@PdUx>*p-+D^n>JPW63$25e=|WD%Z8{o;!jw z2=O&*y_XZ7y;Hb@q*%*bHLevkkDbO45POX4;OkJ2Ula(>=w*7DsRpk#%$@H)Fvdla zbx+;}NAjYW&*`U{d=iDxo39uEInhXHm7ZS*$bGO`CrJKrR7SdA)bq z|M-;Vj(ih#4$mHV{hxn8Vzj4VE6oqj{}>yduDlI2@?a=qXz1WB`5cG{X*a|tBFZQl zU8J>9q3F)mzQKT+;pcuBKQh(xYeg|Z2kP@)lqY;!a!7ur3S!e|q8W(qgCm*yxqWG@z^oK!CH)rHg?CF_yiNWOmj|*T{_B+pih;26< z7 za422$12+l_X5Qq`4CqX{y_x715BxIvkIpQ2|Ts>Ty72#p2mCe6$5% z8OFz6KE@0*;MO0Q1SSEOQ?>95MAzki-loOQ5Ce1JjL2cvGW+?r=IQRUIQjPP2^+rcaA~8SWx(P%M+T(W4YU7z0ovmtL^Iq4-Ap+8vO4NiB2)% z7_IKqJnujE0rXn+;jDIS{2`?82${)u{B@XF7?#QB2|kJ2g~GI@{36KUngSZz|J`AY zpZgo5yT0^F{DP~{O zZl?c={^ramwM>^~V!hOsIp?l$rASDdaA z6yw5!S`Qn*?JqQOFLleZW;OBFXs%wEHOo_X+RCVYt(IwAESYfs=9mwInFdPkr@zDs zm<7f}ch0pql*!NAWol=VDfnl*RID4NPY3%}icUHehneslb5uQ zRvfbFFki*CSC~(Z4vxnaTF;zuO6%O zlpXahhGEOcH&Rnw1Um5_{L{CGEaB_E+?R4Ed=Em4dMVX6kE4%8_~q~H3KOJyByZ!k z?Uy7JmG$(Jbgm?UQiFg*LNTo+8Borbkw{`nT!X6XhE{SPU7Pg zW(kzRl}S7%uN>uqbE8ALpulYU1-43DtzvFXu^G+eROcK7iwbWIS>P;=vYG8XfvSq7 zRzW@H=TfA7<@n&!K!=1Tb)?Ce+qIKtQqn5!x@YlnzrOieVqLz0w&YxhUrK<)CDqZQ zhw68#W2ma*!;v^Z)uXR9PrFlW^`_gsEiRacyM_0+(k)Z+#|Kx#HbOVq2BFF_skt4^ z5m$M|i#@QdK$5awK7-`a{-K)!?*NSq|8mmC8U3K_iHHF8m@45rpd&}~Ott1JEuu>M zY9Sc(?*n&?v|j!9ko4$~(GETR58*s0NhfP{t&SuH>79IzjHYs@2uNANp%KZp?aj20 
ziF5rN^u4r3^DO%phC~cU+HvrlWvPDU%52ru{l7VndRVcSG7F*Wph!J<^88!9dH<_DGxqf3iyLVNu@6pdZ0gzckk}38Pwkf)!sOC?^AP~cb z$s$Qo(Z}+r?bl6b3lAunK%o28ZG|{{DFiBtkW%{9{cQ;3W~D*D#0e7klir)39k=Dn z7ariy;pT5jI}_|=yeh60SL}K>CGj`$J#Dd4<9=`cv{VF%)`EXt6nMNp^fD=iIUxF@ z_2HFl-Z{=}h-g)Rh3g-2 z|9x2MRuc3=iuF4n$Ic+cT?p@bq>G>}LnFs=qJ%*CNQ_9%Vln@(d7$~vi#GhHUaaWK z^jr-g79F!`j4`gLd&)15!!&VxF&9Q?3pc4F>z%B|CW{$vlb-V zoSMelX7_Ngj=0vjm^j>aOU`#lR7ZNm$-p%8D z(d7sJb7%%edj)kx@Fxk#h%3zl{KqUoIeYF>funO=c?gsE{iNSzx^|o_%PW8jVNtC0 z=7kr588=!*=1{WP<4oPq(20*+Q~)Gn;r0S}KFZuRrh4g#sQLUUGQwa|OvPp)eW--~NPjlR$+FCOAN<0gOgFM@q z?IcEa9!p7*msuAhufELZ_|=n8kAC}}bFub3#OGA#ipsXDreaaqay^bNCu_f{;SK-; z{C_{+`}mBHumUVv!I_xZRi>$xw;luC560lFbFI50PRFOm({fRj^7w~_T?80(0XRQ! zt&ei-Nb@G`^6-2yQu+pYBOJ5UOZ3;A`ZIcmefY$Jy&->Y=x?M8nwJkPtK4zALWxUl zz?~YZBez!H%&wSCTf}bdzNr8`%%l0Z5`HEiG)qE`r}tjGOyesz=abxwtPTDKcamHY zqrm?EI(ZOinu~7Ii40a3{V`8yz`E{>ZF{9tPH{{!53cF$+XRjYN>kkNXp@0w-@9Z_8wU_wxe$9wv2iQH{vsJKNDTkn zPN$Tyt(r`Rba}`(25IV4@4ssEz9!%G$vmL=pHit{+1x9O+y1n-lFwoI zp@a}f=%FQ)kVFW9FYi5{zV|+V_RsySS!>OnHP7r>k*pAV71YK&#|L(?>2H{){&m#n zN%rap&Qgswe7{>t9+4tGGqO7Bt||y1|2U#8JZS&VFz3A*wdFcp^8qX=-~alZu3xdo z8IGISV2wx>rmxy1qBwbDM3T58oi4Z!uMRr++tfGpmXv-XRavoiw#gE2`Lceep&A`P z9QPE$V@|AFkB>=vlZ64jH+b#OhWM$RGAn+ zD%@{8lJNf=Fb`;AcdZ^wsa=4-ZlEU`QZ2#3N|dLF4k zL#fC@Ilz4J;Sdz^{xu*VeyJkk3S%7T=(5P@xdbR!sFCkE zn3vjOxSr$gQ&>;CRUKGqNK8{nw?Uo7Z%ul+!9o+$%VqK4zJ2QC_QM3^^}$b2p71Tw z$XdaD+#5e~sZWWrTg;Q-WZZ7+A&yv0c}Phl@g#0QaB2^;rWIVhW%_$8?B@~bWV8Ci zR|Co~d!%29$vp)A%(5s!p9ZXV_NbS^tr}JUsq!&#$SrC9rD)}*gfB953mpze1j^iN zd~xa$W)^wr9RIU~cV!&_mSyBZ{ZBz(a*7b(*Y+DB?)*2s-2-@+-HU{Fv209B}wS7j=l%4)aVI|Gv?5YbKw?XRvt6tR{Ry zmLZqtl@|TnZwI&OT<@=2dB1>x-La53xn%jmjR&toGC__ti>x3i4evYNPErL{LMYdN zGh;uijrm5LzMk;WXbmvDY~{1trWd)V^k(SqRqRALM7#3MKg6(MPZg<j`uK5{ozLe#R(u9W-5~=G^J!#LdPe53tLhP&|Ew zDH~M;gv(1zQ|`Emp<`4hklgMs`_giYO5oYQ=)Eae-Rzq;s0AlZ^Fju!P^#r<*!I^b zcF^z}Y2QGqtkq`7BQ>*yRz1bBz!O2zftUp2F=X*|>5;)I!Kk0*w&XZDx=yCaQc6oUf-+OgX{n-ZU+_QWBG=Y|> zSz93|2+Hr$R#P!lw-i+R88HWXJ+Hfu`g&U?@1$18<}x+2BTy>l6*A`X;~>e@ 
za3yMO$=w%*VMUIoV%n}xBvHg;lf+$YB2p@rT~{puFwt^Q!6j!`uHS^%-!AA9--sSm z!R47bU5zA6s;saV7t(BeI)$hWo0mlzO+5ze-GXBHs0OSTVyYK|z3L zNc4(949T{@$n6q$4`nJH& z)VmL!;Av{V?GnK`JtO^AEOK9IJ zWXRS&?gf838L_jvxfz*+6(eF|>Ry`73STk;M?5ukGiH$~UM&ThiH7ENA_^&{3LO*N zHttgV?RZK4bo2gG+=_4)j5I&0P2=sX8CDP~+RA369$;hY70p{>+ zsU{W9q-FG~tLIN>{}q{7`LUOZ{U$Cyd|-OEH}Ad$HNj}pxSbw@*+%0t^kgk9{3O{i zHtz=qJ*Z|A);WY)bi+&h9}89GH)rnC04mqA&E!nAE?IU=R-LV9D)cfD#yjH@>)M=U zyZ&|-a0`XGEjdlEA~2JVX!$mlYh;6n(jUP!$P9tkMED{0!L2^F=LhE$j5w;i3l-O$ zvr^+%Q9H{!sJicK-#|@r+>x_1j|4xo(80poO+hC-unr5yRBi|-0T5@py@U3~&W@Fg ze*5pt9r`(N^Nde+m3L9C-Gg{6rEi>IJ!YZ%cxm3H^;P8fILI8PWFdO}iFYOg7+zcv z*Xl35roeARCBLn&yBucax>OhClAU9xrW<7pmh0+{4G{y0aa+S8tiPkhw!BM)^{>h+ zDJJJFmC(#{!q9?i_3PYJwk&Y>~eF1hpn+z&)vA){dsU6D$n59GPGqvTD+lzS$s-i4?cwhjOypjQ8`t< zhPhedlG>8t_zP`oI2pzmJo;uTIlQ%_@LbM%UHY7dR8jhUC)o4cNE*zXbpOn?c0?XS zm2=gjzSqsHYd*Z&b9VK|i9o@pQj#@{($3blWmZc1c>==(qCYVAhDE=BJ)2}U{=aN^ z2x&2z^=z94fQKzb)R%LQ;)Sz4xJ=KMnx#5;A;FHSDb32Gxsj90R)u-vNKtL*5j`gx z6)~T{zZV*|*4$$}?=ks+jm3>I&u{O(<;7KPIlmus@2};Y*$joaRu63N^KDwx&)IBF zR>wtaCC21j+OocwkvF>{oZ%7q*nfwq&tCBqt>7v^*B_&?4=9~09|8vUix`uOYp%l# z%bMoVPd{qjlv%;8)Te^bQnW7nWWbyH9cm5h##p*@u zqQVLuXPpa|d~O)oT*>o41HZL+SCxhDGuzT`POFFtSn^vJEO;{kY>Su&#hW^p>qWU# zy0ELHc~bJ`@-xy0E}N|yf>?`?O{n%oFW#><{6b$EFPH%eJ6}0qcp)9$-{T$G|-RJYb;%jq$wu%V{D(B2+?6D6ZkxaOz)tL?f5s`UI zmG^Im?bAS;ODs#(37*1q4_um=_!LXsv9Im^Uwn^Q9&N4VMHQp27&k7})Ui_ucBd2&;g9=nS zpT`z^{>Aj?2Q~%(zf4ityJwvPXQ}sqAdkhqp;uL@AOc60*k?*1eM09e$^#&%G5`dm%T!RLf1M>u!|^rILtf4R{t0sS>2RMGyf} zUh}!?*8pPGFAp{kw_Hub7uZoGpvn=T7zz<`cat&|vHkvyN@IJ{RQti%m(BVtnwbnN{pl?MtIPk3YcEKAlPm}$a9&>SJ6v+5@ z4#vp?cWv$|md?jH(F1}6P`$A>_mCR1bjIsrH-CA?$zw6om}R$}Ol+z1%QW zT&QFPc?mSA^68Sm;?fj9N8>LaMh3FXmnY>nKY{URRmm>EO?6x+qTjhzIVhO+O_*66 z=s~Ik=RHEcD#O z4;9S2zkDtCwf`JUr%mfnnbKOZGR?``Z5BaV?+Za1N0mztRmtXna>dZLC8r;T;75!y z7A{9%Y0WtRQ*EIc5NC-{$~TPEm$<+;Bx4FmJLw(3!4i;ylHlojSBCaqE*Q_Oj!-F@ z_%7R^?`AyuXcF-Oyz^!D*Tep=Y=6i{bh18-5)|&E*A!?q=mgI;lO{-qr+VC;dHspw 
zzGqNRtZ;ITOyzoqnu9Aru8ZSy1^pAS#eB?K;A6+?m}kMp!GUA|xo=-V7Sgjcw#gTm z8lV4CR##*?^&M#PBX6veOwsb@4HET}p9Bh@&)bF^X9Ssqx9WvT?lpyztj7Ev_{z66 zrnkbYly_I=aPzx1MsmR(h8b>*Ar@&U+@2E53s`;zdEjvJ_q@4ZM~fAzpn^&~6EL5% zVY}kEX=CdrXEVYb%|(LL^s9xUJ=zxu#}XQuRbIhPX2MI~!6&C8$dt))KcPQ$3ekKs|vTo7#3^kr9l#?0#~+4(1*S^qpaZZ#5YtxVWT)BDqGc^d3t zt7;R^CSzpwy!n{80TFF-by1L(Be1DxR3kDY7a^7QCZ_0~Wr&@GB@?%5b7ib=t$ghI zCGfhbN#Ea^R8!A<$yCgqr@yWhpKr=N;z%M_jEl3==YUior0~uuhS5N~Sg>lR!BmqeTqvf~x${_);;mGMlH25NA@F zKiW}gyAtyerL^ws!u;pICsBgDyhx!AX0DGv9_0!DyZ3e%R^x3N^zSJVbc4^w2U;zl zQFr50uk>FB*vU_950w#>B8GmwIkMGK${)(|zt@cguC8pq|4EhtB<7{}*`K$XA7?I2 zm!$~Atw?$_o`KzmRBuwd$cnrJzQ6RqVG%I5jeS!rsENPGv3)MKX>7~vk5@djo|MWn zBD%b}AgdKzP_x&Ud7eQNmyHLmiOB^w$pOQPPK!t)XKNTQkGSzfTtbOW9_Jui+U9cS zK$Q<@H|B16-SZjBsS!Uywj0>6ZBB2jj@_H!I%gX@FrUe zh~u>lu7;`l#)DgIrJ2$~PQ_wY#w?8_n(?Pbfi!GALM-to2p&i1 z>85`QkZ&8`Gz{;^dqWwWLEs2wkJ5Xiw!{@y<4oE`c+9SSPNlCr>9~#GJj{(B*w9yB zHJ5(9g3?@VbZAz*^su#Au6wjAMtxj$1=X8Go9oHy*o>3 z^^v+u0meUH^cHguI8K*4)TeW`0b^wq+CuZTAUjUw>I8Qx5lkSqyBODkfD%a z2JPUn0lpL%s5;S=dMHgJWz=C2u}G=HWExM^s(YT#ZhYJ*i|Bn;>+nK*1{YmJt!U9T z?OYgBg%d(SfA@a3Jo!a zSCXJKrqB82NoJmt=}Fpks37cO_L;b^jzKHwbk$sy6I2pC*(`lvPnbHmsW(EvcVbk`(i4)c8~T zJsscJX_uo*@sFZP-+u6YiR;_$It=(qD0VY@S!o7rWKIj&1)q(QYh>G^h%38skoOD)5c`()hO*|#PB|5>?M2UZ0y3@z|z z0p23Ycgq8aV(w>tKs-hsL|0nH+MBWr(r;M@}Eqs3C5fMHAGE2vxG#c=dx|`1pw#(&(CI zfg~*0L^;{QA zJ`p@&o^wVr9~B~eXguK+?0!%R24B#c9F@!DJo>$&C}#C#0v>_V3$jR(79u^xMexmKrhe0l+Wta zu<9q*v8$IPkK^W2-PcO(8x)dbabr`?%NN7DQwLw5UDCv!>c6hC8fZ*uzO~|+ewy~S z(t@D19J@P9V(#vdWIzo(*A%~3?YP|=s?t84@w0p28%5_vFHb|KjGiB$aGu3fs93O%fq#q&=&&5QR9{_`mkGZ&7o08>9roa9kdk2#mH8a||9gEIc zo4;j+yZ{Ivx;gPawy1x#5-{iCO0VVaHa0C^^z3W|gHV@crv@Ib@1&dHY&FNQsS4B_A4}X#^ka@XP!Y21Ew`-8iQQsItr@6=KAb8iK`5)?~_t~ zo8gf1OGy2P-Ckc6NO5jxys-8T!>U=L5X$&QD%U%?7&1_E#0S3~o=R^LRPj*mHvo`< zA=|L9)$Q0%i%*wqnV6(fzw{D6P28+(&4^2>?J?$M0c6UP*HLp_78%v7q?T8ocPWT8 zrw+wM6fi!Ks1=Zvn6c~|>@WVC!8^cT%|WWj`JN1lRzRVs6YH7R6kg4v(Gaa`;>;jO}er^wQf7VGw$>V~@}>n~B0W 
zzICjj~Ba*am<|I~G~fQ>CHMEMz1>sYBn6uRj5^Y7&W01M(69E0kc=f7Ot>J%yt_vB5i7{hF{<_N(Kzi{dFlpO*AR zS<2|A(3os`mW>Tjq|kRF`svM@+2wBZ#bGItt6kFP8UsJLHn(d9%VG>&sFovWL%!Xp zILgVH8KuD6{fUK!Z&Cv|f^VQh$-YJqpZmcji2xx&EYt{6(#(oA`x6qqbKJkAKsubW Ucd;bxKeo_Pf2LOc_{E3+2M+gNX#fBK literal 0 HcmV?d00001 diff --git a/config.json b/config.json new file mode 100644 index 0000000..1898332 --- /dev/null +++ b/config.json @@ -0,0 +1,36 @@ +{ + "architectures": [ + "MixtralForCausalLM" + ], + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": [ + 128009, + 128256 + ], + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 1152, + "max_position_embeddings": 32768, + "model_type": "mixtral", + "num_attention_heads": 32, + "num_experts_per_tok": 8, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "num_local_experts": 64, + "output_router_logits": false, + "pad_token_id": 128001, + "rms_norm_eps": 1e-05, + "rope_theta": 16000000.0, + "router_aux_loss_coef": 0.005, + "router_jitter_noise": 0.0, + "scoring_func": "softmax", + "sliding_window": null, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.51.1", + "use_cache": true, + "vocab_size": 128259 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..6c90e66 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,10 @@ +{ + "_from_model_config": true, + "bos_token_id": 128000, + "eos_token_id": [ + 128009, + 128256 + ], + "pad_token_id": 128001, + "transformers_version": "4.51.1" +} diff --git a/kanana_tool_calls/__pycache__/functionary_kanana_tool_parser.cpython-310.pyc 
b/kanana_tool_calls/__pycache__/functionary_kanana_tool_parser.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..4c95b959884e430620d1ea31f1a82e969ea67803 GIT binary patch literal 8112 zcmbVR-ESO6a-XlAot>RsE|(O)M9C}5lD)P`O3~Rm`(#D3WZhYjX~$Ad=Rusg(e{vB zaz0i)vy!-&H5Ajqy@Y^(90DZK1r!cR;HL!0e{iq&n3rIXw>&vOfIQ_x7mN8-&+d|x zWF^QFTiadTUEN(>UG=MGRH>K}KC^#$f9-cJO42`5W&fvu$_0Gm3$i3JiOIfX)34%7 zfo#ixVk>gaS8Y|aYqo}8)h`6Pt&29zF9wEf1SPu^n6?>|?Q&q*mS`*Zm7r=@gE4z- zAg5;6Fkbh^gSuT8yrMr5Oxly8Z1{(QDSIlIwx@#`dnTB*XM;I=PPCQ$!@;~g9~`ld zh`Q+?4PLTe66Lbr2#(puMA`CR4vyQ$MY-a?5}dG4h;kM4oU~8Ml6TB|bxXEi`=P|f zSnVr`)x7GKYBy0IXLZ!;UK91#*#w*XO0wTzhu9Q;-}H{`EU@WS`H_sCGi(+;XTA9? z6|xqYd|hhJeM7okZYtT>)$1QGU-nuN^FH7_;#ql*!JBfXec~o-%|fPKZnu(5yVj1A z%=oyIw4>1Vv%>F%C}hTU?{?PRoz>0!rfL9c*$DCAg6HA_oKTgOn<_? z8{BP&9=j23cwxKe@%P=>!yJb$t+~miDCqbe$^VpuV!HVc?g?2mAo4G{zW-sk67j&L zPMLMt^Aq2PnQeGlAnJ8UP8AFbw{%G?cE6gb^(oAzg23^zynL4D#m+ia22_kUDWF5nx_ zfOwKEGs#vwmB~!`O2T1jOvPbonMDe^;XyHO;{Habx|OyZ>=0%svP{np}H_sp$@b{HoM zzxCFsvrEnf8ba4epmwK)BZ-%u<*W>j%;lR0`gg=REp|4uN$$m+D2zP_a)SK4<5y_k zqy$ar9ow&^#pm^2hLIVL6S{%tIGO1ug7?hvj(pbl(Q$aZO!m|jg(*z^iaeC&6*(Aaw<7+oS?8TP%HsdWf~}4 zC8jDY_uf30#)-=lXU%h&$DKAy&&Qjvg5X^0;a2Qpn`ZCz=kzA?cwXP7=k#^s7!Jh^ zljjXsc+P-!XA=%3d`|affuF!G?Ml8{7zvz9Y?o;{!%A&5-;h%lMw$2hTH*7MAjCX% z=43VE`a7?qM@*qg*K|dfb=j1ACth?ui^Gv{D+3!Bmq6UROy^$G<>7&oBePNQ6(@HY zg;d_bxjmBmN(#f-DDXxKPmwBrq|8b?@*}CQ;%sr6(+Gego|dX9%+PUbC)h%FFPHsqQ-3Ds$G@7)(F?}Y*nXpIEZg%ny_!xmF%U0RpPm#(On zrO#{7p1cDMK9cz~=`T@JWlJs#jrHZ*#Z~B$seS0Ik1N^Nncgp=kGv(b;)ce5j?r3L z#OSN341N*(d@QbOiVOQt>6cP4{?+Ly!2LPh~HzC@{% z>Nry~H6g#i`$B2~V@x{3emRwP%(RRiFOZ6JH?bCdOCFv*W*JYlR6Z;9wXjYl2G>G0 zl&ryuY5jwJ#jmAW{AY}MlO%1YOzXyq6#h%%rfU2*_*GMt|1GOPp315Z5tXRS#>l#w zwdKbqE+kHwoW3IG_uRIp8=?_XsvSn~;Ip7jBFvwL4m+%u5dgTNTGlfHaq$CJ|Tk?u>6V6eCGuV7X zmiovcdXor|%DQ$(;wO{BmN5MtJ(V8GH{oACgEQ?bU%>3Y9F*?LccrGX+%pAAZ4iEH z7PARBuB7ey&U#E3G6$OlKXO^jFJmQ~LUX1D@hVrTWODbe!vqWm-Yd1kPB(GL;tDIi 
zyBcS*m#JvprxAi8S^dB?Li`_sAJ;(?c?!tHM2MP#j*R=tZ}^YFZoxH=iiOMdg1G1-wR!=za&Kbuiu;ZLL-9qDm5ABdX@fRTbv6TlzwE_pa zqWnx+f%6B>vTPkVs|cKBFx@My0A(=)ILl-ua7}#6_*!1svu5Gg2EWz8Z$3)(Dr`*1 zt+5&#$LQ+MU^n&{9AG^=`rHdKN;8DNIbfP}{A8YV`0*crB+?d{CZfD7!88%Kwh5`J z0;wSnK)E20n$8L+7a2^_F;)@foKh;UoA@>Hi>R@V9;~>nFk_Zl;q$S?5;B4u*qp^= zoB%0*2jt2(yZ9hmsJo0gamQ^fyD-Gv-m5P@ z#62KqA#Lz{C+a4+rCE{Zc`7Hb)S?3&e&~S7qlw!^Dkn&iA2OhZoT~6K6A2(4f~pM5 z14!6LXaz^Z!K$nPp5Qd~Wf4qn;Lcg3L0l;0Q63Xq5!9~ap-ttVW1c*B8AGY5iLD1N^q28>L8@mYCU1-bN{ zcGN}GMQdh_&Yo%}RGJ`3q;h?)BcXU4ah#2hdXHFRgCRr4a*KS~@I!%k^-B+w-phcPCcfpi)VF&72%uR>E06#fx*MTItQ<{ zv^J8BHuR}cj|2{ee#Kl9`{k01eUkrYBA)s+mL~haZXCBOzO(~AJQu7Wz@?%<4K();cq-&<(6=ZRHvDk1&I>>_gr%P zZ&%^7x8yHL9{l$}s<|_sTI5Xk*0f_`?GspgJ*|^gpz-=ZD-#2)>S>waGFoOreeZ1I z-@Pe?lRycR>xb5-)~6rHn`iQfn9S_VvMSB<8O2Mu+Ph>ECLpx7p+U}t6s~!FZdM9q zochG5O+nkWe8h-H{eP9$Xbi&{2^qf-lK>7jIL0Q#rJT5IX_BcPl_O~_W~lB4M~8{d}KUt)DOu`RR7ZDmzvhqmSZ z%urH6f>x)`B37M~!UAk`CRB(H);%@@J9Xw*3Dlr5JL7ChgfY?$-L5&BF`Xf#g_`j| zj{jBcf|489A9nFC!}ZW>WzyJ^{zCeNg0jKyj?dpa4c>wpdp zY6vShMr%Uqoa=EGW2RFIoZvlB_~HFJ3+K{V@ZJ(KW(QiHLytMw5Ak14QQK1bhttD* znubnc(`f%3I+`BX0@ePXS|=NFj^!GJ6&`<}Y~BZ2od;SS$Em);=12NILZzEIPM!Z^ zo-7jkLrLJ&qXYvkz%lag5uuD+M0x%$mFR7Q+e9e2zXDWX;R&V7J;#k(?KWQkH!}e_ z5ufoa821)LAZ(1@5*xRoWUaB+p@ApT#^`;a_gWYw4KIwkt80xMV&I3m$6f4ZxqdIG`w`?YJCdi}A7_=1T%R7=Jw^wU>G|6?WO%o_tNa!XQde$vwOK2t0?WuvBgtZQRLX{o?RPeAi5aH-i$;pTNn+uC{AvMnSw1?9!XUq(<)wCNQD(YwiBz z+w_*8JgMp?5Vf*f)pWV4P0E%|S!fj!@ydX47QI8DM#vlQ6Hg#@SJSa7j52n06)VHj zs)Z3i=qioP`_sHRS_gfieQWF*hOU?e>;`MmcB}N>fq5yN)G!Oi97w;S-N6b-GDP!*a;D5;pUUVAG+S5-S1W$Q|$P5umP4dT&DwPPY^9>>;kW7V3 z%+wf?FNOe9#>F4;y+tA}{{)!{EneV~9)#3!g^M9$3pRvi|Km9baNWNz=%Kc96$1J2HVJzGakA>2* z#vR`e7IClmX8u1XjPOFYz1ZPV615_q@99xEOL9lTG1>2Y*HGa%L9%W7gV(X literal 0 HcmV?d00001 diff --git a/kanana_tool_calls/__pycache__/functionary_kanana_tool_parser.cpython-312.pyc b/kanana_tool_calls/__pycache__/functionary_kanana_tool_parser.cpython-312.pyc new file mode 100644 index 
0000000000000000000000000000000000000000..802b96f4b3fd92cab23c1d78da92c8f25fc1c426 GIT binary patch literal 13786 zcmd6OZBScRmf(AOlF+vV5=a680wja@GzM&p0e=8?`~gYFPIs(HMe+S0Sg>g6q|&^6hb>VKq7 zS9hggYW2}i&2|7$CG+_;`WW7wE5 zg-r=_*qpG0Eu>5rw?o7DCE&?0k)rp#LO~M^^ zCp=+K!W;G`YQwdp%owjr_`<$KeYl>aP4R|AW4MvP=D0u66mBB0CElE93AYf~8V@9b z;UIx+(9ew>To@YK(RmHOo&TRlsw*a?;zz~bh7DwdB5mBZbObjb5-OihI}vi;K4m#4TLkrukhS8J{n7M?6uS_E*V?m_;XQ#gFdRq zZbs8%sl*+`nZofZ(Y-~ZKnJ&9zxhmEGAGeS@7Mpv}==+Um}_=1q;_^xQz zJRj?cC(=C&KtQ1<4rJ?@zR6ABnoq@&X`v^Pf}E~&??Cs7Xy1*l8!+^)V*^J|^h9n! zK{6Ui1NkG; zaR?m{+@W?2RBg+O_MUC0esV>-WvG?vE@JGF{8urqm+G#pXg@J{h=_sWDy$x|yvUlC z^*one;FJ3V09i-`;2r=Es0=+ENe0#kGI}{$#rKyOJy{*)Lc;v)cRCW zYb`S%QW}<7f+Cjsn!4HylhLx;_cT{2B0@4f%A>&j8i({DXewNQvN6ifE}#k%P87cUv|h8OW062O(R)h33ak;YU5uC6WEKn&Cm0qY_*idLffu z*meMWdkum+l;mj6J6c6Y>jsl^bgt+mvt#w_zZ{Z0?Hk88CbFJmdC#Ee8O(WxRxV=Z zz-I4}ic}AhY7u>ukI!CjXQOWKkJl@C03h0XPu>nHhBQ*yZ2fw-E z@-3CHG^?3m#;NbNP!w>No>O&EsS0peH75l6UN!PPjs20YRAvVLF4OmdT56VBW>{t! zc)6@&b<28Izg$t)q9{#l#jSCQTBUjH*QjDF#hD7VU;ccCF2hjFN10kSu!f9*HNK}= zHfESPbE&-wv8J?Dh0}Hwnsca7DOPt|wcm`9HNVHGDKO)hWjguS&l#;wt;a7z4QC0f z3T5{{+GIV#EZL)!97tIRm&*BfKmvHpDt%9r(F$PV1CEBW{}!?3pZn5z`RtQ~br$T9Vm3G_a!a@>=?vMYN)YKAQO%&1I3v8obA zzA_K@sEN_9Y{MC4--x86vl&G_$$BM=KMv!Q4QgdD*0kxxc}~{ESpGZ|@u(9(eW^PY zR^U@{POg|vfkBo`%chb&1X~Dh$^2yqLKbC1GIA+F*=}S5?4ZKivGh%uiE~NWM0Q#w zLm!==hfn{Q!dzm`=^}R}i$K>WipmlWfNM6ii>z zEzy>;sYC`@i$@08s!p8jIIx@-hTNsz^Ce5~k1Ur%4LF>H z@IPQ%xI^t!dmp@c|IK`Lmss7kk;#rs>bBzbCAtUEQ$D`v^*UolA4!4=aNw#wD+oULj7Y|a)W z*xE#U+eYn{y+TZWYHS|b<-Y+Y()iryJzOri9Ml}cS+oa0Id}X^>*}idVtMY{8YtQ?7 zL|@OQA?G`}YLuM5b@~URQs~6bna7uNgD-u2G8=j=>pCI@+VX+(V&HuC!u4DrygIq# zYRJ2SqAR!)=-zG)e!%{C?niU)$8*hnQriIZ>aB%dt81XwBmJ8ff5|*~=@(Y9e=^(u zayIzN{i$6&Ro%S)rs(Qhos?YO9Y_6o!zL{@9TOeLR;@@tdQ+2a>RYw#U8E^{Re?BL zw&0gnXv$G9`TXxrZd)Cz_4&$xSQ*Gw9?4l-H+r91JE3T0@>h1R%NskG5}oI=mUCoVn+lou0PvR&VsHe5S`3b2@G1sqx%22dP=py}h;PLJ zwy=UV9zqBM{0Th}+@*FkM%^U6<8FVZLtwW?uX8L-?6vR5wN| zxUluUZB`2zWSjl306d_KRJv#`9k#h|X2r;lRTI(d^%@s{hwrD`S$g 
z=E3Ow(e+Ty+4+g3bH`Hohg~yN{Yvly@^}0#)ceM>e&$iz**fO$Tr_}xS4$&YrvrGp z$XBRb^>rU~PcIwnE*e!*1qpB#& zMud588g+tl!X@XjkQGi|3-cVW=w?)wvH{Nb#5V;_6O=2}aww#Pg&A<6$>vCz`A{>x z!1G}K0BZ0C5hsg)){uQ)KA15zpi?+F0Eknz; zr~mQdmIqGd_pCdpGOfdS@@jEmGhJ#=cz*eau91cD&7bZ>Q+(#52Cs z(3)@P78|-Z()pg#V$W&m%)~B3HTFEC=*A1Qbm65h8M^TjjR*cZvQ^0z@K$m0NNOPs z+E=dN6^|)@3_isdZ|ElcYH4tI2hf!(OGv_8N)1i54}Q;!(c z(|omT1+iL?a)#Amo$?wX{S+}guc3DnMF7+scmz3?L5m(}MZk!=@i{hUQFC9oW-pTqkxZjrGKyfpQ&v{F-!XL>e4@ zyeJM{#InmY7G73N4%rG`=C@+01+esC46>!T2ry*=7N@~&if~n_B08u*)&;q;Si6{I zFEmjzrlyNp2PT9Xg-AmUSP&o$n#0^bpjQeu4Ad@us+JVaJ-1a+FBTgWEgzv3upUx= zX#XYmgQe_f$doklRdjfi&#TZO3$7>P+&B$~Qv-~%Xg!sUr~n>nLm7&*r0=!7xIH*U zimruBu^n-WXzrcW;s_6MIPi|Ny0ub=Y5io=i_6POYf5ucAv?7Md)czlh%Olu{LC?G z*N+yy5&`W(P$@1e^_Oy0C}Uxbk4!3NbySdR7=|ht+xK-D8>Gx6Wu9wM z+m+&UP=#@%@UK##y^2eXY2-_#LNV3?Bd2($G6SLF61aWTbJ9CB^heCi;wVgq^_#Jj zVOCebAuGj~(t!`BlcYfxIG@wH4O-KS> zcj(6%=NzoggCASesLQU5i~o;bBYm!N>07QY8!0u17Xb&p!$*WvQYpGzlc~=K55q6tj+uTa|k_K@=_i^eMH@;k~8NsYSkw`%$IZ?;Px02S2vzky9;yZ zr5{zRxyv5t;~UTOw&pfDyk*=df78sg23KWL2YY}giOy6{8U0FfU|$030nQS&>iAeA zq>8)n;UhR~#j!Q&xPe|Trmg#M+Nm@EUEm?Mz#%)W5PObfm7M9I)%jPyImcKJ>rJ0k zXRqp+zo!13ri_=4N44tgzLuAD9~JhH{k&wW%IUgFCp(ZQ5Vt;OMrCW|0Qde0Qn6q9 z|7q(DxP)iP1K;7i!+ySI#d~2E?hIarJV%%D`qJu5_GG;K_AdW{VL&qD-KQUFp>-{> z2`bYQYV8cE~+J^nDv$L zl+`>;Q`eVj5)Y~GPkoE%ABDKgKiYu)k;~8lkGhyYg8`n0coY>LC6Z5Kfco}4zW;&O z0t-ABi3-!P7>|1y+?GUna9qHn8DXi59Mt{A_cs0;sq{^Mse&IK6ZwmG+)HiARNBua zQwy^<{fh4eBCIZOet2Y)^5Y{d|00(r*Go$^vrxU*+Rw&jW`_Jh0cL>1yGDk08y@hm zTqK!F!YeHvwUH8$yt9Y=}&TRL#L^@Kd9VfE!n2wdDb*Idb%*X z3tHkd;XF=|T|g`^VStQV>L4$T{Aqp>(ZPss!VKe_U-9NBd4L_TE*;J<|#=yT--4Bo^dxccHb*~HzR z=Ey@hLAFjtupKMaxH`o*J!3=V| zFL^A$<;C-O!jp{?YG-iArh=h*#TD{>MEDK{e}=(b4E{L=e~tnANO*jdz)wQ}H+{f7 z<$VZXhgWSS2eZtiZp_I>ZLGJk=-=VsZBWg~WH=@vwYy}4e zdhe769L1zS9NPF44g7vqwLF5-iMypYIqJJBGKMBa+jdcLqdfAn)uEop56bdE3s$4bzshFKg+8i^ZB+yz5+lBilEg zb4}naXI7+VXAm95}zG}?CcH#J6&vl-0N6tB1?Un#K=W*71rlSJNleHLi~DxLejQu3yT!d-Cof(LMCI zKY!}7cbcF*|h)>&<_4QtBLh?EPimlXU*V>*9si 
zb7R-Vlh?E1=`1@dhG(;#H`gYmmZNLq@Ob8tbK_dRYgFtS&4o_?vgJu4ckY@Py0-P5 zaQ08$%zY;!h9aUb^6(-Mxv^t^m*e^2NpW~G*D$rlNQI7l!40SA>s*6(Ie|Srb!70d z<;nFY;q2fm*;l`l3%-7TYW3<`tK@FpXc66A+Z{bW8TxSOr|f^4`);|-L2A*c1WLpXx?!(=3Pfb*O6^c+lFs5_QWV19|3>wS$cGrqT5e{ z57>K#-eWY?XYm5Nx?$Zdy4qH8=$^p3AiCS7#`et?v2g&Zd#})v@A5MSfo$WzPDl4f z2Bb~x+0~SHwL$9*=a#DrkhQ_p@aCm#>*;*!xY#=W+v3ExbFJUWx&o5Bb>rAm zcUO^#Lt(UjX?5RI*xzP;Nt<#Mks=bXU}`l&Mn zvenwZIiBx-2|T1vk6e^`dLhf&0RB;jb9E$VZ(9G>Q~MF13*@jrz1^OS``#)@d64+?Z zwO`n)VCpZ@yNvE+?H;9Ts$0{+Aiec@PoL=NBRwA#eMgZo$E1OCz+Uedy$Ad{1{d*7 z!H2pXpMQ1Yi`MpykzDJ^$7jXXkyY)MBOrD6Vca1(TzN-_=;+8h@P>Z#*p}n?wxi~O z<-R3be_Wl=mSa+K`&KQ0v!*s*ee`MdQOVz%_Ya8vfz6qme`MAAsnfshYuok&H^%dw zXT;7kQpbSQaq{OKKkItjmtSXZ)U*4g<}=jL~Fy<<`>xMn?!^qpH2ijDZAsPp9bVg#N0# zrQT7PO*Jm;>TY0FYyZmlmZe2cODm=$Meo{(K-GbxHIq- zIeuZw@zSU6x?LS){$cM5Lpi)~FK+Z~TdMLFpJ?%A>o09tE<^G!uDp8%Zk;MUpg^o% z&|NMM-isSOUkPaA{-Rrd-Aw&r;6mVaBlY)nU6Ap;HgOfBFQ*>-N1aRqXGW3 zf=1ZDAZ#{<0d}>A8AfJw0EZk0-*Mm#CvU?54}E1XI?!=Wu5|c22;r@S%z$;Pm~a09 zlh(rB-82`EMMqgi!ED>40_^%OFgnkUyLMNH0I&tX3Ic-8_3Ro6Xrk(a z>sKF6?wU!`LiqygV-H7mtt4rqYMa+v9@g*LNzy@8weD6Du!=I-S2AnYvi2s?*!(*u zW-3oka0a0s#rk9bR-RaZojJeAUxl<>F%N%+5s%&Ab(qq_6EiSYl;<$$Yf@gv5K1d# zjNX{$%~)W;fLN_~d^q^PqZ=*R?v!H1Dps)tZq1ScF=lyz@J;r=6^|#n!Aj#7l{fy- zf=fnY-Sd1ZotjR?`4TIM>5axMF>~dU&udDoP;#K*g>Ln)MHG`v$>m*$1m8i*?cWH= zLOK=~6l>W`8Yo6M??x0RlA}~1mUa`#D4%PDly;Nj7XDF+BChD?QY88Z2>CDwVL*-x zcrcLdJU0u^(BYl9^0xy-9uK@tk`2R3;VA!KpbZT_0ewgCJcFkH7iIpO>Vgpde@1ye zrv^Wv20y1-{(-9fj5_wesiVKs=xNPwDF}XNqiB}?jJo(4)$$qD{24X$TLVRReW|BR z)vK@Pj1716dj?Qvt9^SEM0=K3X?l!aAKs$~@SAy!fv);ZjgGDcjjd_P(p7o7S)`k@ ifst&>XpTO;2Y-P=d)C9xD2$&ml;#ZmCCMX_`hNi@Oo#IT literal 0 HcmV?d00001 diff --git a/kanana_tool_calls/functionary_kanana_tool_parser.py b/kanana_tool_calls/functionary_kanana_tool_parser.py new file mode 100644 index 0000000..2f7882d --- /dev/null +++ b/kanana_tool_calls/functionary_kanana_tool_parser.py @@ -0,0 +1,401 @@ +import json +from json import JSONDecodeError, JSONDecoder +import copy +import uuid +from 
pathlib import Path +from typing import Dict, List, Optional, Union, Sequence +from abc import ABC, abstractmethod + +import partial_json_parser +from partial_json_parser.core.options import Allow + +from transformers import PreTrainedTokenizerBase +from vllm.entrypoints.openai.protocol import ( + ChatCompletionRequest, + ExtractedToolCallInformation, + DeltaMessage, + DeltaFunctionCall, + DeltaToolCall +) +from vllm.entrypoints.openai.tool_parsers.abstract_tool_parser import ToolParser, ToolParserManager +from vllm.entrypoints.openai.tool_parsers.utils import find_common_prefix +from vllm.logger import init_logger +from vllm.utils import random_uuid +from vllm.transformers_utils.tokenizer import AnyTokenizer + + + +from transformers import PreTrainedTokenizer + + +logger = init_logger(__name__) + + + +class BaseTemplate(ABC): + @abstractmethod + def response_to_messages(self, generated_text): + raise NotImplementedError + +class FunctionaryV3Llama31Template(BaseTemplate): + def __init__( + self, + tokenizer: PreTrainedTokenizer + ): + self.tokenizer = tokenizer + + self.system_tokens = "<|start_header_id|>system<|end_header_id|>\n\n" + self.user_tokens = "<|start_header_id|>user<|end_header_id|>\n\n" + self.assistant_tokens = "<|start_header_id|>assistant<|end_header_id|>\n\n" + self.tool_tokens = "<|start_header_id|>ipython<|end_header_id|>\n\n" + + def parse_function_call_from_text(self, function_call_text: str) -> Optional[Dict]: + index = function_call_text.find(">") + if index >= 0: + func_name = function_call_text[:index].strip() + arguments = function_call_text[index + 1:].strip() + return {"name": func_name, "arguments": arguments} + return None + + def response_to_messages(self, generated_text): + # first remove stop tokens if there exists + for stop in [self.tokenizer.eos_token, "<|eom_id|>", "<|end_of_text|>"]: + if generated_text.endswith(stop): + generated_text = generated_text[: -len(stop)] + + tool_calls = [] + text_response = "" + + func_prefix = " 
0: + if generated_text.startswith(python_tag): # check if use code interpreter + code = generated_text[len(python_tag) :] + function_call = { + "name": "python", + "arguments": code, + } + + tool_calls.append( + { + "type": "function", + "id": str(uuid.uuid4()), + "function": function_call, + } + ) + generated_text = "" + elif generated_text.startswith(func_prefix): # Check if function_call + end_index = generated_text.find(end_func) + if end_index >= 0: + function_call_text = generated_text[len(func_prefix) : end_index] + function_call = self.parse_function_call_from_text(function_call_text) + + tool_calls.append( + { + "type": "function", + "id": str(uuid.uuid4()), + "function": function_call, + } + ) + generated_text = generated_text[end_index + len(end_func) :] + else: + # TODO cannot find close function call + text_response += generated_text + break + else: # If text-response + text_response += generated_text[0] + generated_text = generated_text[1:] + + if not text_response: + text_response = None + elif len(text_response.strip()) == 0: + text_response = None + + if not tool_calls: + tool_calls = None + + if tool_calls: + return {"role": "assistant", "content": text_response, "tool_calls": tool_calls} + else: + return {"role": "assistant", "content": text_response} + + + +# partial_json_parser doesn't support extra data and +# JSONDecorder.raw_decode doesn't support partial JSON +def partial_json_loads(input_str, flags): + try: + return partial_json_parser.loads(input_str, flags), len(input_str) + except JSONDecodeError as e: + if "Extra data" in e.msg: + dec = JSONDecoder() + return dec.raw_decode(input_str) + else: + raise + + +def is_complete_json(input_str): + try: + json.loads(input_str) + return True + except JSONDecodeError: + return False + +@ToolParserManager.register_module(["functionary_v3_llama_31"]) +class FunctionaryV3Llama31ToolParser(ToolParser): + def __init__(self, tokenizer: Union[PreTrainedTokenizerBase, AnyTokenizer]): + 
super().__init__(tokenizer) + self.template = FunctionaryV3Llama31Template(tokenizer=tokenizer) + + self._func_prefix = " ExtractedToolCallInformation: + result = self.template.response_to_messages(model_output) + if "tool_calls" in result: + return ExtractedToolCallInformation(tools_called=True, + tool_calls=result["tool_calls"], + content=None) + else: + return ExtractedToolCallInformation(tools_called=False, + tool_calls=[], + content=result["content"]) + + # our template: {"arg":"var"} + def extract_tool_calls_streaming( + self, + previous_text: str, + current_text: str, + delta_text: str, + previous_token_ids: Sequence[int], + current_token_ids: Sequence[int], + delta_token_ids: Sequence[int], + request: ChatCompletionRequest, + ) -> Union[DeltaMessage, None]: + + # if current_text does not start with function tag (or python tag), + if not (current_text.startswith(self._python_tag) + or current_text.startswith(self._func_prefix) + or self._func_prefix.startswith(current_text)): + # for cases like "The answer is + for stop in [self.eos_token, "<|eom_id|>", "<|end_of_text|>"]: + if current_text.rstrip().endswith(stop): + current_text = current_text.rstrip()[: -len(stop)] + + # if current_tool_name is not sent yet, + # don't allow partial sending of strings + # (supposedly, openai also only sends the entire tool name at once) + # not really relevant to kanana + flags = Allow.ALL if self.current_tool_name_sent \ + else Allow.ALL & ~Allow.STR + + try: + tool_call_arr = [] + is_complete = [] + obj = {} + try: + # set start_idx + start_idx = 0 + while start_idx < len(current_text): + name = None + # set function_name and move start_idx to the end of function_name + if current_text[start_idx:].startswith(self._python_tag): + name = "python" + start_idx += len(self._python_tag) + elif current_text[start_idx:].startswith(self._func_prefix): + idx = current_text[start_idx:].find(">") + # found ">" which means function name is ready + if idx != -1: + function_name = 
current_text[start_idx+len(self._func_prefix):start_idx+idx] + name = function_name + start_idx += len(self._func_prefix) + len(function_name) + len(">") + # for cases like: abcd and , which declares the end of a function, + # move start_idx to the end so it can skip + function_end_idx = current_text[start_idx:].find(self._func_suffix) + if function_end_idx != -1: + start_idx += len(self._func_suffix) + # if hasn't been generated fully yet, + # but the function is complete, we break out from while loop + # and stream it right away + elif is_complete[-1]: + break + except partial_json_parser.core.exceptions.MalformedJSON: + logger.debug('not enough tokens to parse into JSON yet') + return None + + # current_tool_call is the one that is being streamed + current_tool_call: dict = tool_call_arr[self.current_tool_id] \ + if len(tool_call_arr) > 0 else {} + + # case0: if there is no tool call in the array, return None + if len(tool_call_arr) == 0: + return None + + # case1: we are starting a new tool in the array + # -> tool_call_arr has > 0 length AND has more elements than cursor + elif (len(tool_call_arr) > 0 + and len(tool_call_arr) > self.current_tool_id + 1): + # if we're moving on to a new call, first make sure we + # haven't missed anything in the previous one that was + # auto-generated due to JSON completions, but wasn't + # streamed to the client yet. + # print("starting a new tool in the array, print remaining") + if self.current_tool_id >= 0: + cur_arguments = current_tool_call.get("arguments") + if cur_arguments: + cur_args_json = json.dumps(cur_arguments, ensure_ascii=False) + sent = len( + self.streamed_args_for_tool[self.current_tool_id]) # streamed args for current tool call + argument_diff = cur_args_json[sent:] # args not yet streamed for current tool call + + logger.debug("got arguments diff: %s", argument_diff) + delta = DeltaMessage(tool_calls=[ + DeltaToolCall(index=self.current_tool_id, + function=DeltaFunctionCall( + arguments=argument_diff). 
+ model_dump(exclude_none=True)) + ]) + self.streamed_args_for_tool[ + self.current_tool_id] += argument_diff # update streamed args for current tool call + else: + delta = None + else: + delta = None + # re-set stuff pertaining to progress in the current tool + self.current_tool_id = len(tool_call_arr) - 1 # update current tool call + self.current_tool_name_sent = False + self.streamed_args_for_tool.append("") + logger.debug("starting on new tool %d", self.current_tool_id) + return delta + + # case2: if the current tool name hasn't been sent, send if available + elif not self.current_tool_name_sent: + function_name = current_tool_call.get("name") + if function_name: + delta = DeltaMessage(tool_calls=[ + DeltaToolCall(index=self.current_tool_id, + type="function", + id=f"chatcmpl-tool-{random_uuid()}", + function=DeltaFunctionCall( + name=function_name).model_dump( + exclude_none=True)) + ]) + self.current_tool_name_sent = True + else: + delta = None + + # case3: now we know we're on the same tool call + # and can stream arguments + else: + cur_arguments = current_tool_call.get("arguments") + delta = None + # '{}' 인경우도 출력 해야함. 
+ sent = len( + self.streamed_args_for_tool[self.current_tool_id]) # streamed args for current tool call + cur_args_json = json.dumps(cur_arguments, ensure_ascii=False) + prev_arguments = self.prev_tool_call_arr[ + self.current_tool_id].get("arguments") + argument_diff = None + # if current tool call is complete + if is_complete[self.current_tool_id]: + argument_diff = cur_args_json[sent:] + # if current tool call is not complete and prev_arguments exists + elif prev_arguments: + prev_args_json = json.dumps(prev_arguments, ensure_ascii=False) + if cur_args_json != prev_args_json: + # common prefix betwn prev and current args + prefix = find_common_prefix( + prev_args_json, cur_args_json) + argument_diff = prefix[sent:] + if argument_diff is not None and len(argument_diff) > 0: + delta = DeltaMessage(tool_calls=[ + DeltaToolCall(index=self.current_tool_id, + function=DeltaFunctionCall( + arguments=argument_diff). + model_dump(exclude_none=True)) + ]) + + self.streamed_args_for_tool[ + self.current_tool_id] += argument_diff + # update previous tool call array + self.prev_tool_call_arr = tool_call_arr + return delta + + except Exception as e: + logger.exception("Error trying to handle streaming tool call.") + logger.debug( + "Skipping chunk as a result of tool streaming extraction " + "error") + return None diff --git a/kanana_tool_calls/lmalign_v1.jinja b/kanana_tool_calls/lmalign_v1.jinja new file mode 100644 index 0000000..0afc386 --- /dev/null +++ b/kanana_tool_calls/lmalign_v1.jinja @@ -0,0 +1,320 @@ +{# version=v3-llama3.1 #}{%- macro append_new_param_info(param_declaration, comment_info, examples_info, depth) -%} + {%- set offset = "" -%} + {%- if depth >= 1 -%} + {%- set offset = " " * depth -%} + {%- endif -%} + {%- if comment_info != "<|NONE|>" -%} + {{ "\n" + offset + comment_info }} + {%- if examples_info | length > 0 -%} + {# Append each example info #} + {%- for example in examples_info -%} + {{ "\n" + offset + "// " + example|string|replace("'", '"') }} 
+ {%- endfor -%} + {%- endif -%} + {%- endif -%} + {{ "\n" + offset + param_declaration }} +{%- endmacro -%} + +{%- macro convert_data_type(param_type) -%} + {%- if param_type == "integer" or param_type == "float" -%} + {{ "number" }} + {%- else -%} + {{ param_type }} + {%- endif -%} +{%- endmacro -%} + +{%- macro get_param_type(param) -%} + {%- set param_type = "any" -%} + + {%- if "type" in param -%} + {%- set raw_param_type = param["type"] -%} + {%- if raw_param_type is iterable and raw_param_type is not string -%} + {%- set param_type = raw_param_type | join(" | ") -%} + {%- else -%} + {%- set param_type = raw_param_type -%} + {%- endif -%} + {{ convert_data_type(param_type) }} + {%- elif "oneOf" in param -%} + {%- set one_of_types = param["oneOf"]|selectattr("type", "defined")|list -%} + {%- set one_of_types = one_of_types|map(attribute="type")|unique|list -%} + {{ convert_data_type(one_of_types | join(" | ")) }} + {%- endif -%} +{%- endmacro -%} + +{%- macro get_format_param(param) -%} + {%- if "format" in param -%} + {{ param["format"] }} + {%- elif "oneOf" in param -%} + {%- set formats = [] -%} + {%- for item in param["oneOf"] -%} + {%- if "format" in item -%} + {%- if item["format"] == param["oneOf"][-1]["format"] -%} + {{ item["format"] }} + {%- else -%} + {{ item["format"] + " or "}} + {%- endif -%} + {%- endif -%} + {%- endfor -%} + {%- else -%} + {{ "<|NONE|>" }} + {%- endif -%} +{%- endmacro -%} + +{%- macro get_param_info(param) -%} + {%- set param_type = param.get("type", "any") -%} + {%- set format_param = get_format_param(param) -%} + + {%- if "description" in param or "default" in param or format_param != "<|NONE|>" or param["maximum"] or param["minimum"] or param["maxLength"] or param["minLength"] -%} + {{ "//" }} + {%- if "description" in param -%} + {%- set desc = param["description"] -%} + {%- if not desc.endswith(".") -%} + {%- set desc = desc + "." 
-%} + {%- endif -%} + {{ " " + desc }} + {%- endif -%} + + {%- if "default" in param -%} + {%- set default_value = param["default"] -%} + {%- if param_type == "string" -%} + {%- set default_value = '"' ~ default_value ~ '"' -%} + {%- endif -%} + {{ " Default=" ~ default_value ~ "." }} + {%- endif -%} + + {%- set format_param = get_format_param(param) -%} + {%- if format_param != "<|NONE|>" -%} + {{ " Format=" ~ format_param }} + {%- endif -%} + + {%- for field, field_name in [("maximum", "Maximum"), ("minimum", "Minimum"), ("maxLength", "Maximum length"), ("minLength", "Minimum length")] -%} + {%- if field in param -%} + {{ " " + field_name ~ "=" ~ param[field] }} + {%- endif -%} + {%- endfor -%} + {%- else -%} + {{ "<|NONE|>"}} + {%- endif -%} +{%- endmacro -%} + +{%- macro get_enum_option_str(enum_options) -%} + {%- for v in enum_options -%} + {%- if v is string -%} + {{ '"' + v + '"' }} + {%- else -%} + {{ v }} + {%- endif -%} + {%- if enum_options|length > 0 and v != enum_options[-1] -%} + {{ " | " }} + {%- endif -%} + {%- endfor -%} +{%- endmacro -%} + +{%- macro get_array_typescript(param_name, param_dic, depth) -%} + {%- set offset = '' -%} + {%- if depth >= 1 -%} + {%- set offset = " " * depth -%} + {%- endif -%} + {%- set items_info = param_dic.get('items', {}) -%} + + {%- if items_info|length == 0 -%} + {%- if param_name -%} + {{ "\n" + offset + param_name + ": []" }} + {%- else -%} + {{ "\n" + offset + "[]" }} + {%- endif -%} + {%- else -%} + {%- set array_type = get_param_type(items_info) -%} + {%- if array_type == 'object' -%} + {%- if param_name -%} + {{ "\n" + offset + param_name + ": {" }} + {%- else -%} + {{ "\n" + offset + "{" }} + {%- endif -%} + {{ get_parameter_typescript(items_info.get('properties', {}), items_info.get('required', []), depth + 1) -}} + {{- "\n" + offset + "}[]" }} + {%- elif array_type == 'array' -%} + {%- set item_info = get_array_typescript(None, items_info, depth + 1) -%} + {%- if not param_name -%} + {{ "\n" + item_info + 
"[]" }} + {%- else -%} + {{ "\n" + offset + param_name + ": " + item_info|trim + "[]" }} + {%- endif -%} + {%- else -%} + {%- if 'enum' in items_info -%} + {%- set item_type = get_enum_option_str(items_info['enum']) -%} + {%- if param_name is none -%} + {{ "(" + item_type + ")[]"}} + {%- else -%} + {{ "\n" + offset + param_name + ": (" + item_type + ")[]" }} + {%- endif -%} + {%- else -%} + {%- if param_name is none -%} + {{ "\n" + array_type + "[]" }} + {%- else -%} + {{ "\n" + offset + param_name + ": " + array_type + "[]," }} + {%- endif -%} + {%- endif -%} + {%- endif -%} + {%- endif -%} +{%- endmacro -%} + +{%- macro get_parameter_typescript(properties, required_params, depth=0) -%} + {%- set res = "" -%} + {%- for param_name, param in properties.items() -%} + {%- if param is mapping -%} + {%- set comment_info = get_param_info(param) -%} + {# Param Examples #} + {%- set examples_info = [] -%} + {%- if "examples" in param -%} + {%- set examples_info = ["Example " + param_name + ":"] -%} + {%- set examples_info = examples_info + param["examples"] -%} + {%- endif -%} + + {# Param Name declaration #} + {%- set param_declaration = param_name -%} + {%- if required_params is iterable and param_name not in required_params -%} + {%- set param_declaration = param_declaration + "?" 
-%} + {%- endif -%} + + {%- set param_type = get_param_type(param) -%} + + {# Handle indentation based on depth #} + {%- set offset = "" -%} + {%- if depth >= 1 -%} + {%- set offset = " " * depth -%} + {%- endif -%} + + {%- if param_type == "object" -%} + {%- if comment_info != "<|NONE|>" -%} + {{ "\n" + offset + comment_info }} + {%- endif -%} + {%- if examples_info|length > 0 -%} + {%- for example in examples_info -%} + {{ "\n" + offset + "// " + example|string|replace("'", '"') }} + {%- endfor -%} + {%- endif -%} + {%- set param_declaration = param_declaration + ": {" -%} + {{ "\n" + offset + param_declaration -}} + {{- get_parameter_typescript(param.get("properties", {}), param.get("required", []), depth + 1) -}} + {{- "\n" + offset + "}," }} + {%- elif param_type == "array" -%} + {%- set item_info = param.get("items", {}) -%} + {%- if "type" not in item_info -%} + {%- set param_declaration = param_declaration + ": []," -%} + {{ append_new_param_info(param_declaration, comment_info, examples_info, depth) }} + {%- else -%} + {%- if comment_info != "<|NONE|>" -%} + {{ "\n" + offset + comment_info }} + {%- endif -%} + {%- if examples_info|length > 0 -%} + {%- for example in examples_info -%} + {{ "\n" + offset + "// " + example|string|replace("'", '"') }} + {%- endfor -%} + {%- endif -%} + {%- set array_declaration = get_array_typescript(param_declaration, param, depth) -%} + {%- if not array_declaration.endswith(",") -%} + {%- set array_declaration = array_declaration + "," -%} + {%- endif -%} + {{ array_declaration}} + {%- endif -%} + {%- else -%} + {%- if "enum" in param -%} + {%- set param_type = get_enum_option_str(param["enum"]) -%} + {%- endif -%} + {%- if "nullable" in param and param["nullable"] -%} + {%- set param_type = param_type + " | null" -%} + {%- endif -%} + {%- set param_declaration = param_declaration + ": " + param_type + "," -%} + {{ append_new_param_info(param_declaration, comment_info, examples_info, depth) }} + {%- endif -%} + {%- endif -%} 
+ {%- endfor -%} +{%- endmacro -%} + +{%- macro generate_schema_from_functions(functions, namespace='functions') -%} + {{ "// Supported function definitions that should be called when necessary.\n" -}} + {{- "namespace " + namespace + " {\n\n" -}} + + {%- for function in functions -%} + {%- if function.get("function") -%} + {%- set function = function.get("function") -%} + {%- endif -%} + + {%- set function_name = function.get("name") -%} + {%- if function_name -%} + {%- set description = function.get('description', '') -%} + {%- set parameters = function.get('parameters', {}) -%} + {{- "// " + description + "\n" -}} + {{- "type " + function_name -}} + {%- if parameters and parameters.get("properties") -%} + {{- " = (_: {" -}} + {%- set required_params = parameters.get("required", []) -%} + {{ get_parameter_typescript(parameters.get("properties"), required_params, 0) -}} + {{- "\n}) => any;\n\n" }} + {%- else -%} + {{ " = () => any;\n\n" }} + {%- endif -%} + {%- endif -%} + {%- endfor -%} + {{ "} // namespace " + namespace }} +{%- endmacro -%} +{%- if not tools is defined -%} + {%- set tools = none -%} +{%- endif -%} + +{%- set has_code_interpreter = tools | selectattr("type", "equalto", "code_interpreter") | list | length > 0 -%} +{%- if has_code_interpreter -%} + {%- set tools = tools | rejectattr("type", "equalto", "code_interpreter") | list -%} +{%- endif -%} + +{#- System message + builtin tools #} +{{- bos_token + "<|start_header_id|>system<|end_header_id|>\n\n" }} +{%- if has_code_interpreter %} + {{- "Environment: ipython\n\n" }} +{%- else -%} + {{ "\n"}} +{%- endif %} +{%- if tools %} + {{- "\nYou have access to the following functions:\n\n" }} + {%- for t in tools %} + {%- if "type" in t -%} + {{ "Use the function '" + t["function"]["name"] + "' to '" + t["function"]["description"] + "'\n" + t["function"] | tojson() }} + {%- else -%} + {{ "Use the function '" + t["name"] + "' to '" + t["description"] + "'\n" + t | tojson }} + {%- endif -%} + {{- "\n\n" }} 
+ {%- endfor %} + {{- '\nThink very carefully before calling functions.\nIf a you choose to call a function ONLY reply in the following format:\n<{start_tag}={function_name}>{parameters}{end_tag}\nwhere\n\nstart_tag => ` a JSON dict with the function argument name as key and function argument value as value.\nend_tag => ``\n\nHere is an example,\n{"example_name": "example_value"}\n\nReminder:\n- If looking for real time information use relevant functions before falling back to brave_search\n- Function calls MUST follow the specified format, start with \n- Required parameters MUST be specified\n- Only call one function at a time\n- Put the entire function call reply on one line\n\n' -}} +{%- endif %} +{{- "<|eot_id|>" -}} + +{%- for message in messages -%} + {%- if message['role'] == 'user' or message['role'] == 'system' -%} + {{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }} + {%- elif message['role'] == 'tool' -%} + {{ '<|start_header_id|>ipython<|end_header_id|>\n\n' + message['content'] + '<|eot_id|>' }} + {%- else -%} + {%- if (message['content'] and message['content']|length > 0) or ('tool_calls' in message and message['tool_calls'] and message['tool_calls']|length > 0) -%} + {{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'}} + {%- endif -%} + {%- if message['content'] and message['content']|length > 0 -%} + {{ message['content'] }} + {%- endif -%} + {%- if 'tool_calls' in message and message['tool_calls'] and message['tool_calls']|length > 0 -%} + {%- for tool_call in message['tool_calls'] -%} + {%- if tool_call["function"]["name"] == "python" -%} + {{ '<|python_tag|>' + tool_call['function']['arguments']|tojson }} + {%- else -%} + {{ '' + tool_call['function']['arguments']|tojson + '' }} + {%- endif -%} + {%- endfor -%} + {{ '<|eom_id|>' }} + {%- elif message['content'] and message['content']|length > 0 -%} + {{ '<|eot_id|>' }} + {%- endif -%} + {%- endif -%} +{%- endfor -%} +{%- 
if add_generation_prompt -%} + {{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }} +{%- endif -%} diff --git a/model-00001-of-00007.safetensors b/model-00001-of-00007.safetensors new file mode 100644 index 0000000..8950825 --- /dev/null +++ b/model-00001-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dad6208f73ba0cc3888e79b00cca1e1cda31918e7eaa54d4817434fb65e9752 +size 4996655056 diff --git a/model-00002-of-00007.safetensors b/model-00002-of-00007.safetensors new file mode 100644 index 0000000..0b6c1af --- /dev/null +++ b/model-00002-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe55eb0566228b34a8048e27ac87be1c3e40707332a9aed5dc20f706b18ed2b8 +size 4996387760 diff --git a/model-00003-of-00007.safetensors b/model-00003-of-00007.safetensors new file mode 100644 index 0000000..c08628e --- /dev/null +++ b/model-00003-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5702b956fc53c7794a5ea02c2970ce8f04c74a1df6d30680f0aa6aba0a8f8c9 +size 4997955960 diff --git a/model-00004-of-00007.safetensors b/model-00004-of-00007.safetensors new file mode 100644 index 0000000..845604e --- /dev/null +++ b/model-00004-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9028ffca029922250bef1ae796c5dd92ced54c06b1b0928250f0f5884afad0a4 +size 4996092176 diff --git a/model-00005-of-00007.safetensors b/model-00005-of-00007.safetensors new file mode 100644 index 0000000..8597024 --- /dev/null +++ b/model-00005-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9169539b4dba1bb628cba22b414664da537aeb497188a7858b9deb6fcf7183ba +size 4996096824 diff --git a/model-00006-of-00007.safetensors b/model-00006-of-00007.safetensors new file mode 100644 index 0000000..33d93c0 --- /dev/null +++ b/model-00006-of-00007.safetensors @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:0fe57c4eafa292e8cc26d7b9ed1b7c8d5ba659e824fd5b99fb19096313169432 +size 4996409992 diff --git a/model-00007-of-00007.safetensors b/model-00007-of-00007.safetensors new file mode 100644 index 0000000..ae5cc52 --- /dev/null +++ b/model-00007-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f241156348251c9ed009dad06600725fe2adf85adceb5420bff385fbe9bfb5 +size 1413793632 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..f048659 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,6378 @@ +{ + "metadata": { + "total_size": 31392559104 + }, + "weight_map": { + "lm_head.weight": "model-00005-of-00007.safetensors", + "model.embed_tokens.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.0.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.0.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.0.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.1.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.1.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.10.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.10.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.10.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.11.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.11.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.12.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.12.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.12.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.13.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.13.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.14.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.14.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.14.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.15.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.15.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.15.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.16.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.17.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.17.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.17.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.18.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.18.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.19.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.19.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.19.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.2.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.20.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.20.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.20.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.21.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.21.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.21.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.22.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.22.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.22.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.23.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.23.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.24.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.24.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.24.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.25.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.26.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.26.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.27.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.27.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.27.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.28.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.28.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.29.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.29.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.3.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.30.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.30.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.30.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.31.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.31.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.31.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.32.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.32.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.32.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.33.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.33.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.34.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.35.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.36.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.36.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.36.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.37.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.38.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.38.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.38.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.39.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.39.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.39.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.4.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.4.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.4.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.40.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.40.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.40.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.41.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.41.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.42.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.42.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.43.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.43.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.44.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.44.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.45.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.45.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.46.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.46.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.47.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.47.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.48.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.48.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.48.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.49.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.49.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.5.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.5.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.5.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.50.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.50.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.50.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.51.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.51.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.52.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.52.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.52.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.54.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.54.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.55.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.56.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.56.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.56.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.57.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.57.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.58.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.58.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.58.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.59.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.59.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.59.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.6.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.6.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.60.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.61.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.61.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.62.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.62.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.62.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.0.block_sparse_moe.experts.63.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.63.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.63.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.7.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.7.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.8.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.9.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.0.block_sparse_moe.experts.9.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.0.block_sparse_moe.gate.weight": "model-00005-of-00007.safetensors", + "model.layers.0.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.0.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.0.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.1.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.10.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.10.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.10.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.11.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.12.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.12.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.12.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.13.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.14.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.14.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.14.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.15.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.15.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.16.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.16.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.17.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.17.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.18.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.18.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.18.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.19.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.19.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.2.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.20.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.20.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.20.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.21.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.21.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.21.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.22.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.22.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.23.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.23.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.23.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.24.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.24.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.25.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.25.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.26.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.26.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.27.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.27.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.27.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.28.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.28.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.28.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.29.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.29.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.3.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.30.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.30.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.30.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.31.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.31.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.31.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.32.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.32.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.32.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.33.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.33.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.34.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.35.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.35.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.35.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.36.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.36.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.37.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.38.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.38.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.38.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.39.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.39.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.39.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.4.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.40.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.40.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.41.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.41.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.41.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.42.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.42.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.42.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.43.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.43.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.43.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.44.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.44.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.44.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.45.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.45.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.45.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.46.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.46.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.46.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.47.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.48.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.48.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.48.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.49.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.49.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.49.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.50.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.50.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.50.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.51.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.51.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.52.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.52.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.53.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.54.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.54.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.55.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.55.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.56.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.56.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.56.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.57.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.57.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.58.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.58.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.58.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.59.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.59.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.experts.60.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.60.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.60.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.61.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.62.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.62.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.62.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.63.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.63.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.63.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.7.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.8.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.9.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.1.block_sparse_moe.experts.9.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.1.block_sparse_moe.gate.weight": "model-00001-of-00007.safetensors", + "model.layers.1.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.0.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.0.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.0.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.1.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.1.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.10.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.10.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.10.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.11.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.12.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.12.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.13.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.13.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.13.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.14.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.14.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.14.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.15.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.15.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.15.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.16.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.17.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.17.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.18.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.18.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.18.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.19.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.19.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.2.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.2.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.2.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.20.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.21.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.21.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.22.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.22.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.23.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.23.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.24.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.24.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.25.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.25.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.25.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.26.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.26.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.27.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.27.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.28.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.29.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.29.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.29.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.3.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.3.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.3.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.30.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.30.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.30.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.31.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.32.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.32.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.33.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.33.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.33.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.34.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.35.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.35.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.36.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.36.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.37.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.37.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.37.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.38.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.38.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.39.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.39.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.39.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.40.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.40.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.40.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.41.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.41.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.42.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.42.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.42.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.43.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.43.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.43.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.44.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.44.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.44.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.45.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.45.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.45.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.46.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.46.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.46.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.47.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.47.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.48.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.48.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.48.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.49.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.49.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.49.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.5.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.5.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.50.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.50.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.50.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.51.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.51.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.52.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.52.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.52.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.53.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.53.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.53.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.54.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.54.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.55.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.55.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.55.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.56.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.56.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.57.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.58.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.58.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.58.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.59.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.59.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.59.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.6.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.6.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.6.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.60.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.60.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.60.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.61.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.61.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.62.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.62.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.63.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.63.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.63.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.10.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.7.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.8.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.8.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.8.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.9.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.9.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.10.block_sparse_moe.experts.9.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.10.block_sparse_moe.gate.weight": "model-00003-of-00007.safetensors", + "model.layers.10.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.0.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.0.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.0.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.1.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.1.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.10.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.10.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.11.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.11.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.12.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.12.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.13.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.14.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.14.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.14.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.15.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.15.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.15.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.16.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.16.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.17.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.17.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.17.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.18.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.18.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.19.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.19.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.19.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.2.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.2.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.20.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.20.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.21.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.21.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.22.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.23.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.23.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.23.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.24.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.24.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.24.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.25.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.25.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.25.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.26.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.26.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.26.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.27.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.27.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.27.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.28.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.28.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.29.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.29.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.3.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.30.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.30.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.30.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.31.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.31.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.31.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.32.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.32.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.32.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.33.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.33.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.33.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.34.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.34.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.35.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.35.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.35.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.36.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.36.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.36.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.37.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.37.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.38.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.38.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.38.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.39.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.39.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.39.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.4.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.40.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.40.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.40.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.41.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.41.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.42.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.42.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.43.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.43.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.43.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.44.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.44.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.44.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.45.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.45.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.45.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.46.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.46.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.46.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.47.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.47.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.48.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.48.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.48.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.49.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.49.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.49.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.5.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.50.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.50.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.50.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.51.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.51.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.51.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.52.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.52.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.53.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.54.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.54.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.54.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.55.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.56.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.56.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.56.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.57.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.57.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.58.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.58.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.58.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.59.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.59.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.6.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.60.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.11.block_sparse_moe.experts.61.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.61.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.62.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.62.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.62.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.63.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.63.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.63.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.8.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.8.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.9.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.9.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.11.block_sparse_moe.experts.9.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.11.block_sparse_moe.gate.weight": "model-00006-of-00007.safetensors", + "model.layers.11.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.11.self_attn.k_proj.weight": 
"model-00007-of-00007.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.0.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.0.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.1.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.1.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.1.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.10.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.10.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.10.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.11.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.11.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.12.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.12.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.12.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.13.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.13.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.13.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.14.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.14.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.14.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.15.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.15.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.16.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.16.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.17.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.17.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.17.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.18.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.18.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.18.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.19.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.19.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.2.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.2.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.20.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.20.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.21.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.21.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.21.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.22.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.22.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.23.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.23.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.24.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.25.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.25.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.25.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.26.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.26.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.26.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.27.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.27.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.28.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.28.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.28.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.29.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.29.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.29.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.3.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.3.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.3.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.30.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.30.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.30.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.31.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.31.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.31.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.32.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.32.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.32.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.33.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.33.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.33.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.34.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.34.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.35.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.35.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.36.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.36.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.36.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.37.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.37.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.37.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.38.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.38.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.39.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.39.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.4.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.4.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.40.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.40.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.41.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.41.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.41.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.42.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.42.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.43.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.43.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.44.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.44.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.44.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.45.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.45.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.45.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.46.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.46.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.47.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.47.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.48.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.48.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.48.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.49.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.49.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.49.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.5.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.50.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.50.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.50.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.51.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.51.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.51.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.52.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.52.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.53.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.53.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.54.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.54.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.54.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.55.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.55.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.56.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.56.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.56.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.57.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.58.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.58.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.59.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.59.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.6.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.6.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.60.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.60.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.60.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.61.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.62.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.62.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.62.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.63.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.63.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.63.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.7.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.7.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.12.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.8.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.8.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.9.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.12.block_sparse_moe.experts.9.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.12.block_sparse_moe.gate.weight": "model-00003-of-00007.safetensors", + "model.layers.12.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.0.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.0.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.1.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.1.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.10.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.10.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.11.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.11.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.12.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.12.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.13.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.14.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.14.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.15.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.15.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.15.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.16.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.16.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.16.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.17.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.17.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.18.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.18.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.19.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.19.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.2.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.2.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.20.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.20.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.21.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.21.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.22.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.22.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.23.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.24.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.24.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.24.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.25.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.25.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.26.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.26.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.26.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.27.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.27.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.27.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.28.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.28.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.28.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.29.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.29.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.3.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.3.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.30.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.30.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.30.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.31.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.31.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.32.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.32.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.32.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.33.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.33.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.33.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.34.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.34.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.34.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.35.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.36.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.36.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.37.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.37.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.38.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.38.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.38.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.39.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.39.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.4.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.4.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.40.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.40.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.40.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.41.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.41.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.42.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.42.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.43.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.43.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.43.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.44.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.44.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.45.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.45.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.45.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.46.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.46.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.46.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.47.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.47.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.47.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.48.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.49.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.49.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.5.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.5.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.5.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.50.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.50.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.50.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.51.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.51.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.51.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.52.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.52.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.52.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.53.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.53.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.53.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.54.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.54.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.54.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.55.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.55.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.55.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.56.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.56.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.56.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.57.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.58.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.58.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.58.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.59.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.59.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.6.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.60.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.60.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.60.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.61.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.61.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.13.block_sparse_moe.experts.62.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.62.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.62.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.63.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.63.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.7.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.7.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.8.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.8.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.9.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.9.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.13.block_sparse_moe.experts.9.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.13.block_sparse_moe.gate.weight": "model-00001-of-00007.safetensors", + "model.layers.13.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.0.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.0.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.1.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.1.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.10.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.10.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.10.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.11.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.11.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.12.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.12.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.12.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.13.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.13.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.14.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.14.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.15.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.15.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.16.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.16.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.16.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.17.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.17.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.18.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.18.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.19.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.2.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.20.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.20.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.20.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.21.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.21.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.22.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.22.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.22.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.23.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.23.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.23.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.24.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.24.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.24.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.25.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.25.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.25.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.26.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.27.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.27.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.27.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.28.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.28.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.29.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.29.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.29.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.3.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.3.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.30.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.30.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.30.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.31.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.31.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.31.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.32.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.32.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.32.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.33.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.33.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.34.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.34.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.35.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.35.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.35.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.36.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.36.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.36.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.37.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.37.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.37.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.38.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.38.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.38.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.39.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.39.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.39.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.4.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.40.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.40.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.40.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.41.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.42.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.43.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.43.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.44.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.44.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.44.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.45.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.46.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.46.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.46.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.47.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.47.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.48.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.48.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.48.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.49.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.5.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.5.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.50.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.50.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.50.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.51.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.51.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.51.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.52.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.52.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.52.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.53.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.53.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.53.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.54.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.54.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.55.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.55.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.56.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.56.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.57.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.57.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.58.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.58.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.58.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.59.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.59.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.59.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.6.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.60.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.60.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.61.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.61.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.61.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.62.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.62.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.62.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.63.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.63.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.7.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.7.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.7.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.8.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.8.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.14.block_sparse_moe.experts.9.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.9.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.14.block_sparse_moe.experts.9.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.14.block_sparse_moe.gate.weight": "model-00002-of-00007.safetensors", + "model.layers.14.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00007-of-00007.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.0.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.0.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.1.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.1.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.10.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.10.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.10.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.11.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.11.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.11.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.12.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.12.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.12.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.13.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.13.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.14.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.14.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.15.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.15.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.15.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.16.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.16.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.16.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.17.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.17.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.18.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.18.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.19.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.19.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.19.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.2.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.2.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.20.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.20.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.21.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.21.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.22.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.23.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.23.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.24.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.24.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.24.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.25.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.25.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.25.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.26.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.27.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.27.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.28.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.28.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.28.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.29.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.3.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.3.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.3.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.30.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.30.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.30.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.31.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.31.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.31.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.32.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.32.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.32.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.33.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.33.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.34.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.34.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.34.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.35.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.36.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.36.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.36.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.37.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.37.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.37.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.38.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.38.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.38.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.39.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.39.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.39.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.40.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.40.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.40.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.41.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.41.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.41.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.42.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.42.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.42.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.43.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.43.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.44.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.44.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.44.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.45.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.45.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.45.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.46.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.46.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.46.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.47.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.48.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.48.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.48.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.49.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.49.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.49.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.5.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.50.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.50.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.51.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.52.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.52.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.52.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.53.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.53.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.53.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.54.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.54.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.54.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.55.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.55.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.56.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.56.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.57.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.57.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.58.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.58.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.58.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.59.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.59.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.59.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.6.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.6.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.60.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.60.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.61.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.61.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.62.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.62.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.15.block_sparse_moe.experts.63.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.63.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.63.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.7.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.7.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.8.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.8.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.8.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.9.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.9.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.15.block_sparse_moe.experts.9.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.15.block_sparse_moe.gate.weight": "model-00002-of-00007.safetensors", + "model.layers.15.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.0.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.0.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.1.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.1.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.10.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.10.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.10.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.11.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.11.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.12.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.12.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.12.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.13.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.13.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.14.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.14.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.14.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.15.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.15.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.15.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.16.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.16.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.17.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.17.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.18.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.18.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.18.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.19.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.19.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.19.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.2.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.20.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.20.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.20.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.21.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.21.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.22.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.22.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.23.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.23.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.24.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.24.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.25.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.26.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.26.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.26.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.27.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.27.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.28.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.28.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.29.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.29.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.29.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.3.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.3.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.30.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.30.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.30.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.31.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.31.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.31.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.32.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.32.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.32.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.33.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.33.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.33.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.34.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.34.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.34.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.35.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.35.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.35.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.36.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.36.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.36.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.37.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.37.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.38.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.38.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.39.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.39.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.4.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.4.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.40.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.40.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.41.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.41.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.41.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.42.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.42.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.43.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.43.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.44.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.44.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.44.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.45.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.45.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.45.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.46.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.46.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.47.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.47.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.47.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.48.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.48.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.48.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.49.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.49.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.5.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.50.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.50.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.50.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.51.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.51.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.51.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.52.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.52.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.53.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.53.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.54.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.54.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.55.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.55.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.56.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.56.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.57.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.57.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.57.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.58.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.58.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.59.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.59.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.59.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.6.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.experts.60.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.61.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.61.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.62.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.62.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.62.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.63.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.63.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.7.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.7.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.8.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.8.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.8.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.9.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.16.block_sparse_moe.experts.9.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.16.block_sparse_moe.gate.weight": "model-00002-of-00007.safetensors", + "model.layers.16.input_layernorm.weight": "model-00007-of-00007.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.1.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.1.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.10.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.10.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.11.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.12.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.12.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.12.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.13.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.13.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.13.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.14.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.14.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.14.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.15.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.15.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.16.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.16.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.16.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.17.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.17.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.18.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.18.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.19.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.19.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.2.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.2.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.2.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.20.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.20.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.21.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.21.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.21.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.22.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.22.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.22.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.23.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.23.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.23.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.24.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.25.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.25.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.25.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.26.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.26.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.27.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.27.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.27.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.28.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.29.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.29.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.29.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.30.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.30.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.30.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.31.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.32.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.32.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.32.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.33.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.33.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.34.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.34.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.34.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.35.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.35.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.36.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.36.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.36.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.37.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.37.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.38.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.38.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.38.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.39.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.39.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.39.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.4.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.4.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.4.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.40.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.40.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.40.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.41.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.41.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.42.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.42.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.43.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.43.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.43.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.44.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.44.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.45.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.45.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.46.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.46.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.46.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.47.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.47.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.47.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.48.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.48.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.48.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.49.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.49.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.5.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.50.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.50.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.50.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.51.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.51.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.51.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.52.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.52.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.53.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.53.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.53.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.54.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.54.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.54.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.55.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.55.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.56.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.56.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.57.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.58.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.58.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.58.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.59.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.59.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.59.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.6.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.6.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.60.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.60.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.60.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.61.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.62.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.62.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.63.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.63.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.63.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.17.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.7.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.8.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.9.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.9.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.17.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.17.block_sparse_moe.gate.weight": "model-00007-of-00007.safetensors", + "model.layers.17.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.0.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.0.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.0.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.10.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.10.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.10.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.11.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.11.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.12.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.12.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.12.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.13.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.13.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.14.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.14.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.14.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.15.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.15.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.15.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.16.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.16.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.16.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.17.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.17.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.17.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.18.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.18.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.18.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.19.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.19.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.19.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.2.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.2.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.20.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.20.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.21.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.21.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.21.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.22.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.22.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.22.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.23.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.23.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.23.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.24.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.24.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.25.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.25.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.26.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.27.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.27.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.27.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.28.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.28.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.29.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.3.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.3.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.30.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.30.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.30.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.31.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.31.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.32.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.32.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.32.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.33.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.33.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.34.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.34.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.34.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.35.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.35.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.36.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.36.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.37.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.37.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.37.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.38.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.38.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.38.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.39.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.39.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.4.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.4.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.40.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.40.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.40.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.41.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.41.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.42.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.42.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.42.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.43.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.43.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.43.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.44.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.44.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.44.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.45.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.46.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.46.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.46.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.47.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.47.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.47.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.48.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.48.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.48.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.49.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.49.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.49.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.5.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.50.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.50.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.50.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.51.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.51.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.51.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.52.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.52.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.53.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.53.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.54.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.54.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.54.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.55.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.55.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.56.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.57.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.57.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.57.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.58.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.58.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.58.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.59.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.59.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.59.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.6.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.60.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.60.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.60.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.18.block_sparse_moe.experts.61.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.61.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.62.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.62.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.63.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.63.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.7.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.7.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.8.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.8.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.8.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.9.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.9.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.experts.9.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.18.block_sparse_moe.gate.weight": "model-00003-of-00007.safetensors", + "model.layers.18.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.18.self_attn.k_proj.weight": 
"model-00003-of-00007.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.0.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.1.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.1.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.10.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.10.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.10.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.11.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.11.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.12.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.12.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.12.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.14.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.14.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.14.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.15.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.15.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.15.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.16.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.16.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.16.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.17.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.17.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.18.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.18.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.19.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.19.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.2.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.2.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.20.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.20.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.21.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.22.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.22.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.23.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.23.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.23.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.24.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.24.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.25.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.25.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.25.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.26.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.26.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.27.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.27.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.27.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.28.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.28.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.29.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.3.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.3.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.30.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.30.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.30.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.31.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.31.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.32.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.32.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.32.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.33.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.33.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.33.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.34.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.34.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.35.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.35.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.35.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.36.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.36.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.36.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.37.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.37.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.37.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.38.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.38.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.38.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.39.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.39.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.4.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.4.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.40.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.40.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.40.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.41.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.41.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.41.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.42.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.42.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.42.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.43.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.43.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.44.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.44.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.44.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.45.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.45.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.46.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.46.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.46.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.47.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.47.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.48.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.48.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.49.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.5.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.5.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.50.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.50.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.50.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.51.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.51.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.52.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.52.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.52.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.53.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.53.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.53.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.54.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.54.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.54.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.55.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.55.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.55.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.56.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.56.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.56.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.57.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.58.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.58.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.59.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.59.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.59.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.6.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.60.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.60.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.60.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.61.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.61.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.61.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.62.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.62.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.62.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.63.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.63.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.19.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.8.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.9.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.19.block_sparse_moe.experts.9.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.19.block_sparse_moe.gate.weight": "model-00004-of-00007.safetensors", + "model.layers.19.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.0.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.1.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.1.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.10.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.10.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.10.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.11.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.11.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.11.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.12.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.12.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.13.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.14.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.14.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.14.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.15.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.15.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.15.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.16.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.16.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.17.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.17.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.18.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.18.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.18.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.19.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.19.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.19.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.2.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.2.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.20.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.20.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.20.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.21.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.21.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.21.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.22.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.22.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.23.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.23.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.24.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.24.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.25.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.25.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.25.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.26.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.27.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.27.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.27.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.28.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.28.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.28.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.29.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.29.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.29.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.30.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.30.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.30.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.31.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.31.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.31.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.32.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.32.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.32.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.33.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.33.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.33.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.34.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.34.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.34.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.35.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.35.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.36.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.36.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.37.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.37.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.38.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.38.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.38.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.39.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.39.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.4.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.4.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.40.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.40.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.40.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.41.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.41.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.42.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.42.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.43.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.44.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.44.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.45.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.45.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.45.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.46.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.46.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.46.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.47.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.47.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.48.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.48.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.48.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.49.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.49.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.5.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.5.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.50.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.50.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.51.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.51.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.52.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.52.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.53.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.53.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.54.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.54.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.55.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.55.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.56.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.56.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.57.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.58.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.58.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.58.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.59.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.59.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.59.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.6.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.60.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.60.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.61.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.2.block_sparse_moe.experts.62.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.62.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.63.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.63.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.7.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.7.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.8.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.9.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.9.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.2.block_sparse_moe.experts.9.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.2.block_sparse_moe.gate.weight": "model-00005-of-00007.safetensors", + "model.layers.2.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00007-of-00007.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.0.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.0.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.10.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.10.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.10.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.11.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.12.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.12.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.12.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.13.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.13.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.14.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.14.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.14.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.15.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.15.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.15.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.16.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.16.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.17.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.17.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.18.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.18.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.19.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.19.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.2.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.2.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.2.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.20.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.20.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.21.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.21.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.21.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.22.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.22.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.23.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.23.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.23.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.24.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.24.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.24.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.25.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.25.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.25.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.26.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.26.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.26.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.27.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.27.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.28.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.28.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.29.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.29.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.3.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.3.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.30.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.30.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.30.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.31.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.31.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.31.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.32.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.32.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.33.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.33.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.33.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.34.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.34.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.34.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.35.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.35.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.35.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.36.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.36.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.36.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.37.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.37.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.38.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.38.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.38.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.39.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.39.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.4.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.4.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.40.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.40.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.41.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.41.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.42.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.42.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.43.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.43.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.44.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.44.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.44.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.45.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.45.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.46.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.46.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.47.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.47.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.48.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.48.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.48.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.49.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.49.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.49.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.5.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.5.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.50.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.50.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.51.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.51.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.51.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.52.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.52.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.52.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.53.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.54.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.54.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.55.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.55.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.56.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.56.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.56.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.57.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.57.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.57.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.58.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.58.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.58.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.59.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.59.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.59.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.6.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.60.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.60.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.61.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.61.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.62.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.62.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.63.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.63.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.7.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.7.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.8.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.8.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.8.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.20.block_sparse_moe.experts.9.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.9.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.20.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.20.block_sparse_moe.gate.weight": "model-00001-of-00007.safetensors", + "model.layers.20.input_layernorm.weight": "model-00007-of-00007.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00007-of-00007.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.0.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.0.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.1.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.10.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.10.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.11.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.11.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.11.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.12.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.12.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.14.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.14.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.14.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.15.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.15.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.15.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.16.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.16.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.17.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.17.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.18.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.18.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.18.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.19.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.2.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.2.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.2.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.20.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.20.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.20.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.21.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.21.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.21.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.22.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.22.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.23.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.23.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.23.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.24.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.24.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.25.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.25.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.26.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.26.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.27.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.27.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.27.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.28.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.28.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.29.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.29.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.3.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.3.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.30.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.30.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.30.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.31.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.32.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.32.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.32.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.33.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.33.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.33.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.34.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.35.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.35.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.36.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.37.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.37.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.38.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.38.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.39.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.39.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.39.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.4.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.4.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.40.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.40.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.40.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.41.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.41.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.42.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.42.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.42.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.43.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.43.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.43.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.44.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.44.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.44.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.45.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.45.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.45.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.46.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.46.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.46.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.47.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.47.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.48.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.49.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.49.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.5.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.5.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.50.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.50.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.51.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.51.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.52.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.52.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.52.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.53.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.53.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.54.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.54.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.54.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.55.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.55.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.56.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.56.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.56.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.58.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.58.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.59.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.59.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.59.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.6.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.60.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.61.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.61.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.62.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.62.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.62.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.21.block_sparse_moe.experts.63.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.63.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.63.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.7.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.7.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.7.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.8.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.8.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.8.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.9.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.9.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.21.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.21.block_sparse_moe.gate.weight": "model-00001-of-00007.safetensors", + "model.layers.21.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.0.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.0.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.1.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.1.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.1.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.10.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.10.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.10.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.11.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.11.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.12.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.12.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.13.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.14.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.14.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.14.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.15.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.15.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.15.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.16.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.16.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.17.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.17.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.18.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.19.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.19.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.19.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.2.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.20.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.20.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.21.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.21.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.21.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.22.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.22.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.23.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.23.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.23.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.24.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.24.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.24.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.25.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.25.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.26.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.26.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.26.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.27.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.27.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.27.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.28.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.28.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.28.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.29.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.29.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.29.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.3.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.3.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.3.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.30.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.30.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.30.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.31.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.31.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.31.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.32.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.32.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.32.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.33.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.33.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.34.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.34.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.34.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.35.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.35.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.35.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.36.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.36.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.36.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.37.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.37.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.38.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.38.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.38.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.39.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.4.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.40.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.40.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.40.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.41.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.41.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.41.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.42.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.42.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.42.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.43.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.43.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.43.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.44.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.44.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.45.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.45.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.45.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.46.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.46.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.46.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.47.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.47.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.48.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.49.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.49.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.5.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.50.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.50.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.50.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.51.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.51.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.51.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.52.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.52.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.52.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.53.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.53.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.54.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.54.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.54.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.55.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.55.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.56.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.57.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.58.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.58.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.59.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.59.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.6.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.6.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.experts.60.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.60.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.61.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.61.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.62.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.62.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.62.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.63.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.63.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.7.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.8.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.8.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.8.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.9.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.22.block_sparse_moe.experts.9.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.22.block_sparse_moe.gate.weight": "model-00001-of-00007.safetensors", + "model.layers.22.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.0.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.1.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.1.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.10.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.10.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.10.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.11.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.11.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.11.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.12.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.12.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.13.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.13.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.13.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.14.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.14.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.15.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.15.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.16.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.16.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.16.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.17.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.18.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.18.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.18.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.19.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.19.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.19.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.2.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.20.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.21.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.21.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.22.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.22.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.22.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.23.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.23.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.23.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.24.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.24.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.24.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.25.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.25.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.25.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.26.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.26.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.27.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.27.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.27.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.28.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.28.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.28.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.29.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.29.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.3.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.3.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.30.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.30.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.30.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.31.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.31.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.32.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.32.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.32.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.33.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.33.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.33.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.34.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.34.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.35.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.35.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.36.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.36.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.36.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.37.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.37.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.38.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.38.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.38.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.39.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.39.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.39.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.4.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.4.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.40.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.40.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.40.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.41.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.41.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.42.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.42.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.43.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.43.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.43.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.44.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.45.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.45.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.45.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.46.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.46.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.46.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.47.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.47.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.48.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.48.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.49.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.49.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.5.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.50.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.50.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.50.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.51.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.51.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.52.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.52.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.53.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.53.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.53.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.54.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.54.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.54.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.55.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.55.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.56.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.56.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.56.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.57.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.57.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.58.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.58.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.58.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.59.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.59.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.6.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.60.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.60.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.61.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.61.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.62.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.62.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.62.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.63.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.63.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.63.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.23.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.7.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.8.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.8.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.8.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.9.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.23.block_sparse_moe.gate.weight": "model-00005-of-00007.safetensors", + "model.layers.23.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.0.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.0.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.0.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.1.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.1.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.10.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.10.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.11.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.11.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.12.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.12.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.12.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.13.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.14.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.14.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.14.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.15.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.15.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.15.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.16.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.16.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.17.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.17.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.18.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.18.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.18.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.19.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.19.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.19.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.20.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.20.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.20.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.21.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.21.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.21.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.22.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.22.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.22.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.23.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.23.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.23.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.24.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.24.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.24.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.25.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.25.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.25.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.26.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.26.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.26.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.27.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.27.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.28.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.28.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.28.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.29.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.29.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.3.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.30.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.30.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.30.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.31.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.31.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.31.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.32.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.32.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.32.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.33.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.33.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.35.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.35.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.36.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.36.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.36.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.37.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.37.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.37.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.38.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.38.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.38.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.39.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.39.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.40.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.40.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.40.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.41.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.41.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.41.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.42.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.42.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.43.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.43.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.43.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.44.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.44.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.45.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.46.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.46.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.47.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.48.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.48.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.49.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.49.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.49.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.5.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.5.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.50.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.50.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.50.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.51.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.51.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.52.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.52.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.52.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.53.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.54.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.54.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.55.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.55.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.55.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.56.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.56.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.56.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.57.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.57.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.58.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.58.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.59.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.59.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.59.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.6.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.6.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.60.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.60.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.24.block_sparse_moe.experts.61.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.61.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.62.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.62.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.62.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.63.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.63.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.63.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.7.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.8.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.8.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.9.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.9.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.24.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.24.block_sparse_moe.gate.weight": "model-00005-of-00007.safetensors", + "model.layers.24.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.24.self_attn.k_proj.weight": 
"model-00002-of-00007.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.0.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.0.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.1.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.10.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.10.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.11.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.11.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.11.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.12.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.12.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.12.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.13.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.13.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.14.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.14.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.14.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.15.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.15.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.15.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.16.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.16.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.17.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.17.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.18.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.18.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.19.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.19.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.2.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.2.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.20.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.20.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.21.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.21.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.22.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.22.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.23.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.23.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.24.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.24.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.25.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.25.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.25.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.26.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.26.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.26.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.27.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.27.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.28.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.28.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.29.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.29.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.29.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.3.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.3.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.30.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.30.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.30.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.31.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.31.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.32.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.32.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.33.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.33.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.33.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.34.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.34.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.35.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.35.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.35.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.36.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.36.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.37.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.37.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.38.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.38.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.39.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.39.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.39.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.4.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.4.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.4.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.40.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.40.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.41.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.42.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.42.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.42.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.43.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.43.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.44.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.44.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.45.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.45.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.45.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.46.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.46.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.46.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.47.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.47.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.48.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.48.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.49.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.49.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.49.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.5.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.50.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.50.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.51.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.51.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.51.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.52.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.52.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.52.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.53.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.53.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.54.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.54.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.54.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.55.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.55.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.56.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.57.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.58.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.58.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.58.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.59.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.59.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.6.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.60.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.60.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.60.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.61.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.61.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.62.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.62.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.63.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.63.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.7.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.7.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.7.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.25.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.8.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.9.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.9.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.25.block_sparse_moe.experts.9.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.25.block_sparse_moe.gate.weight": "model-00002-of-00007.safetensors", + "model.layers.25.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00007-of-00007.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.1.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.1.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.10.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.10.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.10.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.11.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.12.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.12.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.12.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.13.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.13.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.14.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.14.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.14.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.15.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.15.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.16.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.16.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.17.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.17.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.18.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.18.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.19.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.19.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.2.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.20.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.20.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.20.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.21.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.21.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.21.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.22.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.22.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.22.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.23.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.23.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.24.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.25.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.25.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.26.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.26.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.26.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.27.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.27.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.27.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.28.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.28.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.29.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.3.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.3.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.30.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.30.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.30.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.31.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.31.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.32.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.32.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.32.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.33.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.33.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.34.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.34.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.34.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.35.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.35.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.35.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.36.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.37.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.37.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.37.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.38.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.38.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.38.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.39.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.4.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.4.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.40.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.40.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.40.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.41.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.42.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.42.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.42.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.43.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.43.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.44.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.44.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.45.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.45.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.45.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.46.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.46.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.46.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.47.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.48.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.48.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.48.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.49.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.5.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.5.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.5.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.50.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.50.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.51.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.51.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.52.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.52.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.52.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.53.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.53.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.54.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.54.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.55.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.55.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.56.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.56.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.56.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.57.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.57.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.57.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.58.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.58.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.58.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.59.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.59.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.59.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.60.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.60.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.61.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.61.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.61.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.26.block_sparse_moe.experts.62.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.62.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.62.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.63.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.63.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.7.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.7.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.8.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.8.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.9.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.26.block_sparse_moe.experts.9.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.26.block_sparse_moe.gate.weight": "model-00005-of-00007.safetensors", + "model.layers.26.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.0.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.1.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.1.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.10.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.10.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.10.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.11.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.11.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.11.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.12.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.12.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.12.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.13.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.13.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.13.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.14.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.14.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.14.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.15.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.15.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.15.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.16.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.16.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.17.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.17.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.18.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.18.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.18.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.19.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.19.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.2.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.20.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.21.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.21.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.21.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.22.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.22.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.22.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.23.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.23.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.23.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.24.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.24.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.24.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.25.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.25.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.26.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.26.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.26.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.27.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.27.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.27.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.28.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.28.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.29.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.3.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.30.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.30.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.30.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.31.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.31.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.31.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.32.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.32.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.33.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.33.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.34.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.34.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.34.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.35.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.35.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.35.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.36.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.36.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.37.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.37.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.38.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.38.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.38.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.39.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.39.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.39.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.4.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.4.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.40.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.40.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.40.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.41.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.41.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.41.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.42.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.42.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.43.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.43.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.43.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.44.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.44.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.44.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.45.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.45.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.45.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.46.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.46.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.47.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.47.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.47.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.48.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.48.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.48.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.49.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.5.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.5.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.50.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.50.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.51.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.51.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.51.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.52.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.52.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.52.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.53.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.53.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.54.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.54.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.54.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.55.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.55.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.56.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.56.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.57.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.57.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.58.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.58.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.59.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.59.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.59.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.6.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.6.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.60.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.60.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.61.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.61.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.62.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.62.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.63.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.63.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.63.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.7.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.7.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.8.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.8.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.27.block_sparse_moe.experts.9.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.27.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.27.block_sparse_moe.gate.weight": "model-00006-of-00007.safetensors", + "model.layers.27.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.0.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.0.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.1.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.1.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.10.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.10.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.10.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.11.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.11.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.11.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.12.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.12.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.12.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.13.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.13.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.14.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.14.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.14.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.15.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.15.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.16.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.16.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.16.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.17.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.17.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.18.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.18.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.19.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.19.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.19.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.2.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.2.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.2.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.20.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.20.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.21.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.21.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.21.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.22.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.22.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.23.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.23.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.23.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.24.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.24.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.24.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.25.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.25.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.25.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.26.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.26.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.26.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.27.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.27.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.27.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.28.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.28.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.28.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.29.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.29.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.29.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.3.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.3.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.3.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.30.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.30.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.30.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.31.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.31.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.31.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.32.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.32.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.32.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.33.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.33.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.33.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.34.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.35.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.35.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.35.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.36.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.36.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.37.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.37.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.38.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.38.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.38.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.39.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.39.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.4.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.40.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.40.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.40.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.41.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.41.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.42.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.42.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.42.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.43.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.43.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.43.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.44.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.44.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.45.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.45.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.45.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.46.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.46.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.46.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.47.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.47.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.48.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.48.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.48.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.49.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.49.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.49.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.5.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.5.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.50.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.50.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.50.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.51.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.51.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.52.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.52.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.53.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.53.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.53.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.54.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.54.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.55.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.55.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.55.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.56.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.56.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.56.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.57.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.58.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.58.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.58.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.59.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.59.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.6.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.6.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.60.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.60.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.61.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.61.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.62.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.62.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.62.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.28.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.63.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.63.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.7.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.7.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.7.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.8.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.8.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.9.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.9.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.28.block_sparse_moe.experts.9.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.28.block_sparse_moe.gate.weight": "model-00004-of-00007.safetensors", + "model.layers.28.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.0.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.1.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.1.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.10.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.10.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.10.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.11.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.11.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.12.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.12.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.12.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.13.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.14.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.14.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.14.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.15.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.15.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.15.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.16.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.16.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.16.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.17.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.17.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.18.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.19.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.19.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.2.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.2.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.2.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.20.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.20.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.20.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.21.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.21.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.21.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.22.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.22.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.23.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.24.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.24.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.25.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.25.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.26.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.26.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.27.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.27.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.27.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.28.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.28.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.28.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.29.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.29.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.3.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.30.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.30.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.30.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.31.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.31.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.31.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.32.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.32.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.32.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.33.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.33.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.34.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.34.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.35.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.35.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.35.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.36.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.36.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.37.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.38.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.38.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.39.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.39.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.39.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.4.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.4.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.40.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.40.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.40.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.41.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.41.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.42.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.42.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.42.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.43.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.43.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.43.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.44.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.44.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.44.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.45.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.45.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.46.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.46.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.46.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.47.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.47.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.48.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.49.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.49.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.5.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.50.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.50.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.50.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.51.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.51.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.51.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.52.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.52.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.52.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.54.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.54.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.54.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.55.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.55.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.56.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.56.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.56.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.57.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.57.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.57.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.58.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.58.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.58.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.59.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.59.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.59.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.6.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.experts.60.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.60.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.60.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.61.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.61.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.62.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.62.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.63.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.63.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.7.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.7.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.7.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.8.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.8.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.9.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.29.block_sparse_moe.experts.9.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.29.block_sparse_moe.gate.weight": "model-00003-of-00007.safetensors", + "model.layers.29.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.0.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.1.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.10.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.10.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.10.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.11.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.11.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.11.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.12.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.12.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.12.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.13.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.13.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.14.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.14.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.15.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.15.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.15.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.16.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.16.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.16.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.17.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.17.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.17.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.18.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.18.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.19.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.19.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.19.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.2.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.2.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.20.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.20.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.21.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.21.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.21.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.22.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.23.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.24.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.24.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.24.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.25.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.25.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.25.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.26.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.26.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.27.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.27.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.27.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.28.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.29.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.29.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.3.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.3.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.30.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.30.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.30.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.31.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.31.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.32.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.32.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.32.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.33.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.34.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.34.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.34.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.35.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.35.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.36.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.37.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.37.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.37.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.38.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.38.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.38.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.39.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.39.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.4.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.40.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.40.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.40.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.41.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.41.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.41.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.42.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.42.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.43.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.43.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.44.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.44.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.45.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.45.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.46.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.46.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.46.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.47.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.47.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.48.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.49.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.49.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.5.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.5.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.50.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.50.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.50.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.51.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.51.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.52.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.52.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.52.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.53.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.54.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.55.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.56.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.56.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.56.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.57.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.57.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.58.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.58.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.58.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.59.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.59.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.59.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.6.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.60.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.60.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.61.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.61.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.62.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.62.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.62.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.63.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.63.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.3.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.7.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.7.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.8.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.8.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.9.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.3.block_sparse_moe.gate.weight": "model-00003-of-00007.safetensors", + "model.layers.3.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.0.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.0.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.1.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.10.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.10.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.11.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.11.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.11.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.12.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.12.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.12.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.13.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.13.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.13.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.14.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.14.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.14.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.15.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.15.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.16.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.16.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.17.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.17.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.18.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.19.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.2.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.2.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.20.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.20.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.21.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.21.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.21.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.22.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.22.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.23.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.23.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.23.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.24.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.24.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.24.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.25.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.26.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.26.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.27.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.27.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.27.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.28.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.28.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.28.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.29.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.29.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.29.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.3.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.30.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.30.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.30.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.31.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.31.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.31.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.32.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.32.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.32.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.33.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.33.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.33.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.34.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.34.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.35.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.35.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.36.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.36.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.36.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.37.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.37.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.38.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.38.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.39.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.39.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.39.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.4.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.4.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.40.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.40.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.40.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.41.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.41.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.41.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.42.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.42.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.42.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.43.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.43.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.44.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.45.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.45.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.46.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.46.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.46.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.47.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.47.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.47.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.48.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.48.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.48.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.49.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.49.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.49.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.5.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.5.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.50.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.50.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.50.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.51.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.51.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.52.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.52.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.52.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.53.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.53.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.53.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.54.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.54.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.54.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.55.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.55.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.56.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.56.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.56.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.57.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.57.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.57.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.58.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.58.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.58.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.59.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.59.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.59.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.6.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.6.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.6.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.60.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.60.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.30.block_sparse_moe.experts.61.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.61.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.61.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.62.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.63.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.63.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.63.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.7.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.8.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.8.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.9.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.30.block_sparse_moe.experts.9.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.30.block_sparse_moe.gate.weight": "model-00006-of-00007.safetensors", + "model.layers.30.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.30.self_attn.k_proj.weight": 
"model-00007-of-00007.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.0.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.0.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.1.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.1.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.10.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.10.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.10.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.11.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.11.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.11.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.12.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.12.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.12.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.13.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.13.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.13.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.14.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.14.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.15.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.15.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.15.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.16.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.16.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.16.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.17.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.17.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.17.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.18.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.18.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.18.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.19.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.19.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.19.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.2.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.2.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.20.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.20.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.20.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.21.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.21.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.21.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.22.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.22.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.22.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.23.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.23.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.23.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.24.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.24.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.24.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.25.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.25.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.26.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.26.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.26.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.27.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.27.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.27.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.28.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.28.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.29.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.29.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.3.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.3.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.30.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.30.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.30.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.31.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.31.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.31.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.32.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.32.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.32.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.33.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.33.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.33.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.34.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.35.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.35.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.35.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.36.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.36.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.36.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.37.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.37.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.37.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.38.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.38.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.39.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.39.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.39.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.4.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.4.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.4.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.40.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.40.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.40.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.41.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.42.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.42.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.42.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.43.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.43.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.43.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.44.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.44.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.44.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.45.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.45.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.45.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.46.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.46.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.46.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.47.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.47.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.48.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.48.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.49.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.49.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.5.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.5.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.50.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.50.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.50.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.51.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.51.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.52.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.52.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.52.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.53.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.53.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.54.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.54.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.54.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.55.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.55.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.56.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.56.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.57.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.57.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.57.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.58.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.58.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.58.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.59.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.59.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.59.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.6.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.60.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.60.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.61.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.62.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.62.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.63.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.63.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.7.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.31.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.8.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.9.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.9.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.31.block_sparse_moe.experts.9.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.31.block_sparse_moe.gate.weight": "model-00006-of-00007.safetensors", + "model.layers.31.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.0.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.0.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.1.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.1.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.10.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.10.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.10.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.11.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.11.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.11.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.12.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.12.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.12.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.13.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.13.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.14.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.14.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.15.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.15.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.16.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.16.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.17.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.17.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.17.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.18.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.18.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.19.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.19.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.19.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.2.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.2.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.20.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.20.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.20.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.21.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.22.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.22.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.23.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.23.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.24.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.24.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.25.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.26.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.26.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.27.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.27.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.27.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.28.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.28.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.29.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.29.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.3.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.30.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.30.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.30.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.31.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.31.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.32.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.32.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.32.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.33.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.33.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.34.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.34.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.34.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.35.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.35.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.36.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.36.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.36.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.37.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.37.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.38.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.38.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.39.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.39.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.4.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.4.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.4.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.40.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.40.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.41.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.41.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.42.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.42.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.43.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.43.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.43.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.44.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.44.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.44.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.45.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.45.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.46.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.46.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.47.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.47.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.48.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.48.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.49.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.49.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.5.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.5.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.50.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.50.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.50.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.51.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.51.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.51.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.52.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.52.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.52.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.53.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.53.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.53.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.54.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.54.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.55.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.55.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.56.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.57.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.57.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.57.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.58.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.58.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.58.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.59.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.59.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.59.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.6.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.6.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.6.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.60.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.60.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.61.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.61.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.4.block_sparse_moe.experts.62.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.62.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.62.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.63.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.63.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.7.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.7.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.8.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.8.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.9.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.9.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.4.block_sparse_moe.experts.9.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.4.block_sparse_moe.gate.weight": "model-00006-of-00007.safetensors", + "model.layers.4.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.0.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.0.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.1.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.10.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.10.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.10.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.11.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.11.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.11.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.12.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.12.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.12.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.13.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.13.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.14.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.14.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.14.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.15.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.15.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.15.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.16.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.16.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.16.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.17.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.17.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.18.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.18.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.18.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.19.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.19.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.19.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.2.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.2.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.20.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.20.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.20.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.21.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.22.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.22.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.22.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.23.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.23.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.23.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.24.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.24.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.24.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.25.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.25.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.25.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.26.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.26.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.27.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.27.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.27.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.28.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.28.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.28.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.29.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.29.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.3.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.3.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.3.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.30.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.30.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.30.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.31.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.31.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.31.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.32.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.32.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.33.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.33.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.34.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.34.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.35.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.35.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.35.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.36.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.36.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.36.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.37.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.37.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.38.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.38.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.38.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.39.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.39.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.39.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.4.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.4.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.40.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.40.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.40.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.41.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.42.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.42.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.43.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.43.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.44.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.44.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.44.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.45.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.45.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.45.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.46.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.46.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.46.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.47.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.47.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.47.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.48.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.48.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.48.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.49.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.49.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.5.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.50.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.50.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.50.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.51.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.51.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.51.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.52.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.52.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.52.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.53.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.53.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.54.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.54.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.55.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.55.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.56.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.56.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.56.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.57.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.57.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.57.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.58.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.58.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.58.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.59.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.59.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.59.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.6.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.6.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.60.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.60.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.61.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.61.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.61.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.62.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.62.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.62.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.63.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.63.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.63.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.7.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.7.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.8.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.8.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.5.block_sparse_moe.experts.9.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.9.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.5.block_sparse_moe.experts.9.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.5.block_sparse_moe.gate.weight": "model-00002-of-00007.safetensors", + "model.layers.5.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.0.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.1.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.10.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.10.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.10.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.11.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.11.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.11.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.12.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.12.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.12.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.13.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.13.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.14.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.14.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.14.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.15.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.15.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.15.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.16.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.16.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.16.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.17.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.17.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.18.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.18.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.19.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.19.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.2.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.2.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.20.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.20.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.21.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.21.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.21.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.22.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.22.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.23.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.23.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.24.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.24.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.24.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.25.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.25.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.25.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.26.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.26.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.27.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.27.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.27.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.28.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.28.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.29.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.29.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.29.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.3.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.3.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.30.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.30.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.30.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.31.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.31.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.31.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.32.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.32.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.33.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.33.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.33.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.34.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.34.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.34.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.35.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.35.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.36.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.36.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.36.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.37.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.37.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.37.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.38.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.38.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.38.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.39.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.39.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.39.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.4.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.4.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.4.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.40.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.40.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.41.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.41.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.42.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.42.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.42.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.43.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.43.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.43.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.44.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.44.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.45.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.45.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.45.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.46.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.46.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.46.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.47.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.47.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.47.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.48.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.48.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.48.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.49.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.49.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.5.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.5.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.50.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.50.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.50.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.51.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.51.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.51.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.52.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.52.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.52.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.53.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.54.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.54.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.54.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.55.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.56.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.56.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.56.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.57.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.57.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.57.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.58.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.58.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.58.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.59.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.59.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.59.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.6.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.6.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.60.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.61.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.61.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.62.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.62.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.6.block_sparse_moe.experts.63.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.63.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.63.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.7.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.7.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.7.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.8.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.8.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.9.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.experts.9.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.6.block_sparse_moe.gate.weight": "model-00002-of-00007.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.0.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.0.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.1.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.1.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.10.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.10.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.10.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.11.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.11.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.11.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.12.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.12.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.12.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.13.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.13.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.14.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.14.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.14.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.15.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.15.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.15.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.16.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.16.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.16.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.17.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.17.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.17.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.18.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.19.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.19.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.2.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.2.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.20.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.21.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.21.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.21.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.22.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.22.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.22.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.23.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.23.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.23.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.24.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.24.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.24.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.25.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.25.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.25.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.26.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.26.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.26.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.27.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.27.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.27.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.28.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.28.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.28.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.29.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.29.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.29.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.3.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.3.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.30.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.30.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.30.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.31.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.31.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.31.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.32.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.32.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.33.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.33.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.33.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.34.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.34.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.35.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.35.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.35.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.36.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.36.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.36.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.37.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.37.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.37.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.38.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.38.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.38.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.39.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.39.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.39.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.4.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.4.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.4.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.40.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.40.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.40.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.41.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.41.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.41.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.42.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.42.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.42.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.43.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.43.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.43.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.44.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.44.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.44.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.45.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.45.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.46.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.46.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.46.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.47.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.47.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.47.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.48.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.48.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.48.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.49.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.49.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.5.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.5.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.5.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.50.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.50.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.50.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.51.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.51.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.51.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.52.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.52.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.52.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.53.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.53.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.54.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.54.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.54.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.55.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.55.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.56.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.56.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.56.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.57.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.57.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.57.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.58.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.58.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.58.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.59.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.59.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.59.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.6.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.6.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.6.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.experts.60.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.60.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.60.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.61.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.61.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.61.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.62.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.62.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.62.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.63.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.63.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.63.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.7.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.8.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.8.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.8.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.9.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.7.block_sparse_moe.experts.9.w3.weight": "model-00005-of-00007.safetensors", + 
"model.layers.7.block_sparse_moe.gate.weight": "model-00005-of-00007.safetensors", + "model.layers.7.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.0.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.0.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.0.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.1.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.1.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.10.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.10.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.10.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.11.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.11.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.11.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.12.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.12.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.12.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.13.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.13.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.13.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.14.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.14.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.14.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.15.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.15.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.15.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.16.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.16.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.16.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.17.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.17.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.17.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.18.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.18.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.18.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.19.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.19.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.19.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.2.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.2.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.2.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.20.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.20.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.21.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.21.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.21.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.22.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.22.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.22.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.23.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.23.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.23.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.24.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.24.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.24.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.25.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.25.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.25.w3.weight": "model-00007-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.26.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.26.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.26.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.27.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.27.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.27.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.28.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.28.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.28.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.29.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.29.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.29.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.3.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.3.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.3.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.30.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.30.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.30.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.31.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.31.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.31.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.32.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.32.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.32.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.33.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.33.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.34.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.34.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.35.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.35.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.35.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.36.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.36.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.37.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.37.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.38.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.38.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.38.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.39.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.39.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.39.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.4.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.4.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.4.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.40.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.40.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.40.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.41.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.41.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.42.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.42.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.42.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.43.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.43.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.43.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.44.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.44.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.44.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.45.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.45.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.45.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.46.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.46.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.47.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.47.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.47.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.48.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.48.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.48.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.49.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.49.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.49.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.5.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.5.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.50.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.50.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.50.w3.weight": "model-00002-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.51.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.51.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.51.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.52.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.52.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.52.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.53.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.53.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.54.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.54.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.54.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.55.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.55.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.55.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.56.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.56.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.56.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.57.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.57.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.57.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.58.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.58.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.58.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.59.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.59.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.59.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.6.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.6.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.6.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.60.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.60.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.60.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.61.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.61.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.61.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.62.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.62.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.63.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.63.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.63.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.8.block_sparse_moe.experts.7.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.7.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.7.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.8.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.8.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.9.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.9.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.8.block_sparse_moe.experts.9.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.8.block_sparse_moe.gate.weight": "model-00002-of-00007.safetensors", + "model.layers.8.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00007-of-00007.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.0.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.0.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.0.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.1.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.1.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.1.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.10.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.10.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.10.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.11.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.11.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.11.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.12.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.12.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.12.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.13.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.13.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.13.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.14.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.14.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.14.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.15.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.15.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.15.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.16.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.16.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.16.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.17.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.17.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.17.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.18.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.18.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.18.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.19.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.19.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.19.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.2.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.2.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.2.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.20.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.20.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.20.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.21.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.21.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.21.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.22.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.22.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.22.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.23.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.23.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.23.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.24.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.24.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.24.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.25.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.25.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.25.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.26.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.26.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.26.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.27.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.27.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.27.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.28.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.28.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.28.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.29.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.29.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.29.w3.weight": "model-00006-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.3.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.3.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.3.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.30.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.30.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.30.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.31.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.31.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.31.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.32.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.32.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.32.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.33.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.33.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.33.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.34.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.34.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.34.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.35.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.35.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.35.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.36.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.36.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.36.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.37.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.37.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.37.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.38.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.38.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.38.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.39.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.39.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.39.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.4.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.4.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.4.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.40.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.40.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.40.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.41.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.41.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.41.w3.weight": "model-00003-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.42.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.42.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.42.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.43.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.43.w2.weight": "model-00007-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.43.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.44.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.44.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.44.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.45.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.45.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.45.w3.weight": "model-00007-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.46.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.46.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.46.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.47.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.47.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.47.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.48.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.48.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.48.w3.weight": "model-00001-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.49.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.49.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.49.w3.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.5.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.5.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.5.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.50.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.50.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.50.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.51.w1.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.51.w2.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.51.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.52.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.52.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.52.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.53.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.53.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.53.w3.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.54.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.54.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.54.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.55.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.55.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.55.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.56.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.56.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.56.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.57.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.57.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.57.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.58.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.58.w2.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.58.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.59.w1.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.59.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.59.w3.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.6.w1.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.6.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.6.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.60.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.60.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.60.w3.weight": "model-00004-of-00007.safetensors", + 
"model.layers.9.block_sparse_moe.experts.61.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.61.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.61.w3.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.62.w1.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.62.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.62.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.63.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.63.w2.weight": "model-00003-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.63.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.7.w1.weight": "model-00007-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.7.w2.weight": "model-00004-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.7.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.8.w1.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.8.w2.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.8.w3.weight": "model-00002-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.9.w1.weight": "model-00001-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.9.w2.weight": "model-00006-of-00007.safetensors", + "model.layers.9.block_sparse_moe.experts.9.w3.weight": "model-00005-of-00007.safetensors", + "model.layers.9.block_sparse_moe.gate.weight": "model-00001-of-00007.safetensors", + "model.layers.9.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.9.self_attn.k_proj.weight": 
"model-00003-of-00007.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.norm.weight": "model-00001-of-00007.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..278b7f0 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,23 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..b30d9b2 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44e2a3cfdfa7530be35f0d72c39b37ff438d4a1e69cc285b3ee461987d0bfa7 +size 17210623 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..fe5b44b --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2092 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128004": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + 
"special": true + }, + "128016": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + 
"normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_58|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": 
"<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + 
"128087": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + 
"special": true + }, + "128099": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_129|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": 
"<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128158": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_188|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": 
"<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128217": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_247|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_248|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_249|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_250|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128256": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128257": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128258": { + "content": "<|NONE|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "chat_template": "{# version=v3-llama3.1 #}{%- macro append_new_param_info(param_declaration, comment_info, examples_info, depth) -%}\n {%- set offset = \"\" -%}\n {%- if depth >= 1 -%}\n {%- set offset = \" \" * depth -%}\n {%- endif -%}\n {%- if comment_info != \"<|NONE|>\" -%}\n {{ \"\\n\" + offset + comment_info }}\n {%- if examples_info | length > 0 -%}\n {# Append each example info #}\n {%- for example in examples_info -%}\n {{ \"\\n\" + offset + \"// \" + example|string|replace(\"'\", '\"') }}\n {%- endfor -%}\n {%- endif -%}\n {%- endif -%}\n {{ \"\\n\" + offset + param_declaration }}\n{%- endmacro -%}\n\n{%- macro convert_data_type(param_type) -%}\n {%- if param_type == \"integer\" or param_type == \"float\" -%}\n {{ \"number\" }}\n {%- else -%}\n {{ param_type }}\n {%- endif -%}\n{%- endmacro -%}\n\n{%- macro get_param_type(param) -%}\n {%- set param_type = \"any\" -%}\n\n 
{%- if \"type\" in param -%}\n {%- set raw_param_type = param[\"type\"] -%}\n {%- if raw_param_type is iterable and raw_param_type is not string -%}\n {%- set param_type = raw_param_type | join(\" | \") -%}\n {%- else -%}\n {%- set param_type = raw_param_type -%}\n {%- endif -%}\n {{ convert_data_type(param_type) }}\n {%- elif \"oneOf\" in param -%}\n {%- set one_of_types = param[\"oneOf\"]|selectattr(\"type\", \"defined\")|list -%}\n {%- set one_of_types = one_of_types|map(attribute=\"type\")|unique|list -%}\n {{ convert_data_type(one_of_types | join(\" | \")) }}\n {%- endif -%}\n{%- endmacro -%}\n\n{%- macro get_format_param(param) -%}\n {%- if \"format\" in param -%}\n {{ param[\"format\"] }}\n {%- elif \"oneOf\" in param -%}\n {%- set formats = [] -%}\n {%- for item in param[\"oneOf\"] -%}\n {%- if \"format\" in item -%}\n {%- if item[\"format\"] == param[\"oneOf\"][-1][\"format\"] -%}\n {{ item[\"format\"] }}\n {%- else -%}\n {{ item[\"format\"] + \" or \"}}\n {%- endif -%}\n {%- endif -%}\n {%- endfor -%}\n {%- else -%}\n {{ \"<|NONE|>\" }}\n {%- endif -%}\n{%- endmacro -%}\n\n{%- macro get_param_info(param) -%}\n {%- set param_type = param.get(\"type\", \"any\") -%}\n {%- set format_param = get_format_param(param) -%}\n\n {%- if \"description\" in param or \"default\" in param or format_param != \"<|NONE|>\" or param[\"maximum\"] or param[\"minimum\"] or param[\"maxLength\"] or param[\"minLength\"] -%}\n {{ \"//\" }}\n {%- if \"description\" in param -%}\n {%- set desc = param[\"description\"] -%}\n {%- if not desc.endswith(\".\") -%}\n {%- set desc = desc + \".\" -%}\n {%- endif -%}\n {{ \" \" + desc }}\n {%- endif -%}\n\n {%- if \"default\" in param -%}\n {%- set default_value = param[\"default\"] -%}\n {%- if param_type == \"string\" -%}\n {%- set default_value = '\"' ~ default_value ~ '\"' -%}\n {%- endif -%}\n {{ \" Default=\" ~ default_value ~ \".\" }}\n {%- endif -%}\n\n {%- set format_param = get_format_param(param) -%}\n {%- if format_param != 
\"<|NONE|>\" -%}\n {{ \" Format=\" ~ format_param }}\n {%- endif -%}\n\n {%- for field, field_name in [(\"maximum\", \"Maximum\"), (\"minimum\", \"Minimum\"), (\"maxLength\", \"Maximum length\"), (\"minLength\", \"Minimum length\")] -%}\n {%- if field in param -%}\n {{ \" \" + field_name ~ \"=\" ~ param[field] }}\n {%- endif -%}\n {%- endfor -%}\n {%- else -%}\n {{ \"<|NONE|>\"}}\n {%- endif -%}\n{%- endmacro -%}\n\n{%- macro get_enum_option_str(enum_options) -%}\n {%- for v in enum_options -%}\n {%- if v is string -%}\n {{ '\"' + v + '\"' }}\n {%- else -%}\n {{ v }}\n {%- endif -%}\n {%- if enum_options|length > 0 and v != enum_options[-1] -%}\n {{ \" | \" }}\n {%- endif -%}\n {%- endfor -%}\n{%- endmacro -%}\n\n{%- macro get_array_typescript(param_name, param_dic, depth) -%}\n {%- set offset = '' -%}\n {%- if depth >= 1 -%}\n {%- set offset = \" \" * depth -%}\n {%- endif -%}\n {%- set items_info = param_dic.get('items', {}) -%}\n\n {%- if items_info|length == 0 -%}\n {%- if param_name -%}\n {{ \"\\n\" + offset + param_name + \": []\" }}\n {%- else -%}\n {{ \"\\n\" + offset + \"[]\" }}\n {%- endif -%}\n {%- else -%}\n {%- set array_type = get_param_type(items_info) -%}\n {%- if array_type == 'object' -%}\n {%- if param_name -%}\n {{ \"\\n\" + offset + param_name + \": {\" }}\n {%- else -%}\n {{ \"\\n\" + offset + \"{\" }}\n {%- endif -%}\n {{ get_parameter_typescript(items_info.get('properties', {}), items_info.get('required', []), depth + 1) -}}\n {{- \"\\n\" + offset + \"}[]\" }}\n {%- elif array_type == 'array' -%}\n {%- set item_info = get_array_typescript(None, items_info, depth + 1) -%}\n {%- if not param_name -%}\n {{ \"\\n\" + item_info + \"[]\" }}\n {%- else -%}\n {{ \"\\n\" + offset + param_name + \": \" + item_info|trim + \"[]\" }}\n {%- endif -%}\n {%- else -%}\n {%- if 'enum' in items_info -%}\n {%- set item_type = get_enum_option_str(items_info['enum']) -%}\n {%- if param_name is none -%}\n {{ \"(\" + item_type + \")[]\"}}\n {%- else -%}\n {{ 
\"\\n\" + offset + param_name + \": (\" + item_type + \")[]\" }}\n {%- endif -%}\n {%- else -%}\n {%- if param_name is none -%}\n {{ \"\\n\" + array_type + \"[]\" }}\n {%- else -%}\n {{ \"\\n\" + offset + param_name + \": \" + array_type + \"[],\" }}\n {%- endif -%}\n {%- endif -%}\n {%- endif -%}\n {%- endif -%}\n{%- endmacro -%}\n\n{%- macro get_parameter_typescript(properties, required_params, depth=0) -%}\n {%- set res = \"\" -%}\n {%- for param_name, param in properties.items() -%}\n {%- if param is mapping -%}\n {%- set comment_info = get_param_info(param) -%}\n {# Param Examples #}\n {%- set examples_info = [] -%}\n {%- if \"examples\" in param -%}\n {%- set examples_info = [\"Example \" + param_name + \":\"] -%}\n {%- set examples_info = examples_info + param[\"examples\"] -%}\n {%- endif -%}\n\n {# Param Name declaration #}\n {%- set param_declaration = param_name -%}\n {%- if required_params is iterable and param_name not in required_params -%}\n {%- set param_declaration = param_declaration + \"?\" -%}\n {%- endif -%}\n\n {%- set param_type = get_param_type(param) -%}\n\n {# Handle indentation based on depth #}\n {%- set offset = \"\" -%}\n {%- if depth >= 1 -%}\n {%- set offset = \" \" * depth -%}\n {%- endif -%}\n\n {%- if param_type == \"object\" -%}\n {%- if comment_info != \"<|NONE|>\" -%}\n {{ \"\\n\" + offset + comment_info }}\n {%- endif -%}\n {%- if examples_info|length > 0 -%}\n {%- for example in examples_info -%}\n {{ \"\\n\" + offset + \"// \" + example|string|replace(\"'\", '\"') }}\n {%- endfor -%}\n {%- endif -%}\n {%- set param_declaration = param_declaration + \": {\" -%}\n {{ \"\\n\" + offset + param_declaration -}}\n {{- get_parameter_typescript(param.get(\"properties\", {}), param.get(\"required\", []), depth + 1) -}}\n {{- \"\\n\" + offset + \"},\" }}\n {%- elif param_type == \"array\" -%}\n {%- set item_info = param.get(\"items\", {}) -%}\n {%- if \"type\" not in item_info -%}\n {%- set param_declaration = param_declaration + \": 
[],\" -%}\n {{ append_new_param_info(param_declaration, comment_info, examples_info, depth) }}\n {%- else -%}\n {%- if comment_info != \"<|NONE|>\" -%}\n {{ \"\\n\" + offset + comment_info }}\n {%- endif -%}\n {%- if examples_info|length > 0 -%}\n {%- for example in examples_info -%}\n {{ \"\\n\" + offset + \"// \" + example|string|replace(\"'\", '\"') }}\n {%- endfor -%}\n {%- endif -%}\n {%- set array_declaration = get_array_typescript(param_declaration, param, depth) -%}\n {%- if not array_declaration.endswith(\",\") -%}\n {%- set array_declaration = array_declaration + \",\" -%}\n {%- endif -%}\n {{ array_declaration}}\n {%- endif -%}\n {%- else -%}\n {%- if \"enum\" in param -%}\n {%- set param_type = get_enum_option_str(param[\"enum\"]) -%}\n {%- endif -%}\n {%- if \"nullable\" in param and param[\"nullable\"] -%}\n {%- set param_type = param_type + \" | null\" -%}\n {%- endif -%}\n {%- set param_declaration = param_declaration + \": \" + param_type + \",\" -%}\n {{ append_new_param_info(param_declaration, comment_info, examples_info, depth) }}\n {%- endif -%}\n {%- endif -%}\n {%- endfor -%}\n{%- endmacro -%}\n\n{%- macro generate_schema_from_functions(functions, namespace='functions') -%}\n {{ \"// Supported function definitions that should be called when necessary.\\n\" -}}\n {{- \"namespace \" + namespace + \" {\\n\\n\" -}}\n\n {%- for function in functions -%}\n {%- if function.get(\"function\") -%}\n {%- set function = function.get(\"function\") -%}\n {%- endif -%}\n\n {%- set function_name = function.get(\"name\") -%}\n {%- if function_name -%}\n {%- set description = function.get('description', '') -%}\n {%- set parameters = function.get('parameters', {}) -%}\n {{- \"// \" + description + \"\\n\" -}}\n {{- \"type \" + function_name -}}\n {%- if parameters and parameters.get(\"properties\") -%}\n {{- \" = (_: {\" -}}\n {%- set required_params = parameters.get(\"required\", []) -%}\n {{ get_parameter_typescript(parameters.get(\"properties\"), 
required_params, 0) -}}\n {{- \"\\n}) => any;\\n\\n\" }}\n {%- else -%}\n {{ \" = () => any;\\n\\n\" }}\n {%- endif -%}\n {%- endif -%}\n {%- endfor -%}\n {{ \"} // namespace \" + namespace }}\n{%- endmacro -%}\n\n{%- if not tools is defined -%}\n {%- set tools = none -%}\n{%- endif -%}\n\n{%- set has_code_interpreter = tools | selectattr(\"type\", \"equalto\", \"code_interpreter\") | list | length > 0 -%}\n{%- if has_code_interpreter -%}\n {%- set tools = tools | rejectattr(\"type\", \"equalto\", \"code_interpreter\") | list -%}\n{%- endif -%}\n\n{#- System message + builtin tools #}\n{{- bos_token + \"<|start_header_id|>system<|end_header_id|>\\n\\n\" }}\n{%- if has_code_interpreter %}\n {{- \"Environment: ipython\\n\\n\" }}\n{%- else -%}\n {{ \"\"}}\n{%- endif %}\n{%- if tools %}\n {{- \"\\nYou have access to the following functions:\\n\\n\" }}\n {%- for t in tools %}\n {%- if \"type\" in t -%}\n {{ \"Use the function '\" + t[\"function\"][\"name\"] + \"' to '\" + t[\"function\"][\"description\"] + \"'\\n\" + t[\"function\"] | tojson() }}\n {%- else -%}\n {{ \"Use the function '\" + t[\"name\"] + \"' to '\" + t[\"description\"] + \"'\\n\" + t | tojson }}\n {%- endif -%}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n {{- '\\nThink very carefully before calling functions.\\nIf a you choose to call a function ONLY reply in the following format:\\n<{start_tag}={function_name}>{parameters}{end_tag}\\nwhere\\n\\nstart_tag => `<function`\\nparameters => a JSON dict with the function argument name as key and function argument value as value.\\nend_tag => `</function>`\\n\\nHere is an example,\\n<function=example_function_name>{\"example_name\": \"example_value\"}</function>\\n\\nReminder:\\n- If looking for real time information use relevant functions before falling back to brave_search\\n- Function calls MUST follow the specified format, start with <function= and end with </function>\\n- Required parameters MUST be specified\\n- Only call one function at a time\\n- Put the entire function call reply on one line\\n\\n' -}}\n{%- endif %}\n{{- \"<|eot_id|>\" -}}\n\n{%- for message in messages
-%}\n {%- if message['role'] == 'user' or message['role'] == 'system' -%}\n {{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n' + message['content'] + '<|eot_id|>' }}\n {%- elif message['role'] == 'tool' -%}\n {{ '<|start_header_id|>ipython<|end_header_id|>\\n\\n' + message['content'] + '<|eot_id|>' }}\n {%- else -%}\n {%- if (message['content'] and message['content']|length > 0) or ('tool_calls' in message and message['tool_calls'] and message['tool_calls']|length > 0) -%}\n {{ '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n'}}\n {%- endif -%}\n {%- if message['content'] and message['content']|length > 0 -%}\n {{ message['content'] }}\n {%- endif -%}\n {%- if 'tool_calls' in message and message['tool_calls'] and message['tool_calls']|length > 0 -%}\n {%- for tool_call in message['tool_calls'] -%}\n {%- if tool_call[\"function\"][\"name\"] == \"python\" -%}\n {{ '<|python_tag|>' + tool_call['function']['arguments'] }}\n {%- else -%}\n {{ '<function=' + tool_call['function']['name'] + '>' + tool_call['function']['arguments'] + '</function>' }}\n {%- endif -%}\n {%- endfor -%}\n {{ '<|eom_id|>' }}\n {%- elif message['content'] and message['content']|length > 0 -%}\n {{ '<|eot_id|>' }}\n {%- endif -%}\n {%- endif -%}\n{%- endfor -%}\n{%- if add_generation_prompt -%}\n {{ '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}\n{%- endif -%}\n", + "clean_up_tokenization_spaces": false, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "max_length": 8192, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 1000000000000000019884624838656, + "pad_token": "<|end_of_text|>", + "stride": 0, + "tokenizer_class": "PreTrainedTokenizer", + "truncation_side": "right", + "truncation_strategy": "longest_first" +}