初始化项目，由ModelHub XC社区提供模型

Model: Fengshenbang/Ziya-LLaMA-13B-v1.1 Source: Original Platform
2026-05-25 16:25:14 +08:00
commit 89c333fe7b
40 changed files with 373 additions and 0 deletions
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,32 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bin.* filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zstandard filter=lfs diff=lfs merge=lfs -text
+*.tfevents* filter=lfs diff=lfs merge=lfs -text
+*.db* filter=lfs diff=lfs merge=lfs -text
+*.ark* filter=lfs diff=lfs merge=lfs -text
+**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text
+**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text
+**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text
--- a/README.md
+++ b/README.md
@@ -0,0 +1,79 @@
+---
+license: GPL-3.0
+tasks:
+- text-generation
+language:
+- en
+- zh
+
+studios:
+- Fengshenbang/Ziya_LLaMA_13B_v1_online
+
+---
+
+
+# Ziya-LLaMA-13B-v1.1
+
+- Main Page: [Fengshenbang](https://fengshenbang-lm.com/)
+- Github: [Fengshenbang-LM](https://github.com/IDEA-CCNL/Fengshenbang-LM)
+
+
+# 姜子牙系列模型
+- [Ziya-LLaMA-13B-v1.1](https://modelscope.cn/models/Fengshenbang/Ziya-LLaMA-13B-v1.1)
+- [Ziya-LLaMA-13B-v1](https://modelscope.cn/models/Fengshenbang/Ziya-LLaMA-13B-v1/summary)
+- [Ziya-LLaMA-7B-Reward](https://huggingface.co/IDEA-CCNL/Ziya-LLaMA-7B-Reward)
+- [Ziya-LLaMA-13B-Pretrain-v1](https://huggingface.co/IDEA-CCNL/Ziya-LLaMA-13B-Pretrain-v1)
+- [Ziya-BLIP2-14B-Visual-v1](https://modelscope.cn/models/Fengshenbang/Ziya-BLIP2-14B-Visual-v1/summary)
+
+## 简介 Brief Introduction
+我们对Ziya-LLaMA-13B-v1模型进行继续优化，推出开源版本Ziya-LLaMA-13B-v1.1。通过调整微调数据的比例和采用更优的强化学习策略，本版本在问答准确性、数学能力以及安全性等方面得到了提升，详细能力分析如下图所示。
+
+We have further optimized the Ziya-LLaMA-13B-v1 model and released the open-source version Ziya-LLaMA-13B-v1.1. By adjusting the proportion of fine-tuning data and adopting a better reinforcement learning strategy, this version has achieved improvements in question-answering accuracy, mathematical ability, and safety, as shown in the following figure in detail.
+
+<img src="https://huggingface.co/IDEA-CCNL/Ziya-LLaMA-13B-v1.1/resolve/main/pk.png" width=1000 height=600>
+
+## 软件依赖 Requirements
+```bash
+pip install torch==1.12.1 tokenizers==0.13.3 git+https://github.com/huggingface/transformers
+```
+## <span id="jump"> 使用 Usage </span>
+```python
+from modelscope.utils.constant import Tasks
+from modelscope.pipelines import pipeline
+pipe = pipeline(task=Tasks.text_generation, model='Fengshenbang/Ziya-LLaMA-13B-v1.1', model_revision='v1.0.2', device='cuda')
+query="帮我写一份去西安的旅游计划"
+inputs = '<human>:' + query.strip() + '\n<bot>:'
+result = pipe(inputs)
+print(result)
+
+```
+
+
+
+## 引用 Citation
+
+如果您在您的工作中使用了我们的模型，可以引用我们的[论文](https://arxiv.org/abs/2209.02970)：
+
+If you are using the resource for your work, please cite our [paper](https://arxiv.org/abs/2209.02970):
+
+```text
+@article{fengshenbang,
+  author    = {Jiaxing Zhang and Ruyi Gan and Junjie Wang and Yuxiang Zhang and Lin Zhang and Ping Yang and Xinyu Gao and Ziwei Wu and Xiaoqun Dong and Junqing He and Jianheng Zhuo and Qi Yang and Yongfeng Huang and Xiayu Li and Yanghan Wu and Junyu Lu and Xinyu Zhu and Weifeng Chen and Ting Han and Kunhao Pan and Rui Wang and Hao Wang and Xiaojun Wu and Zhongshen Zeng and Chongpei Chen},
+  title     = {Fengshenbang 1.0: Being the Foundation of Chinese Cognitive Intelligence},
+  journal   = {CoRR},
+  volume    = {abs/2209.02970},
+  year      = {2022}
+}
+```
+
+You can also cite our [website](https://github.com/IDEA-CCNL/Fengshenbang-LM/):
+
+欢迎引用我们的[网站](https://github.com/IDEA-CCNL/Fengshenbang-LM/):
+```text
+@misc{Fengshenbang-LM,
+  title={Fengshenbang-LM},
+  author={IDEA-CCNL},
+  year={2021},
+  howpublished={\url{https://github.com/IDEA-CCNL/Fengshenbang-LM}},
+}
+```
--- a/added_tokens.json
+++ b/added_tokens.json
@@ -0,0 +1,4 @@
+{
+  "<bot>": 39409,
+  "<human>": 39408
+}
--- a/config.json
+++ b/config.json
@@ -0,0 +1,23 @@
+{
+  "_name_or_path": "/cognitive_comp/wanghao/models/llama_sft/llama_13B_v2_S2.2_S3_S3.1_rlhf_0601_RM13B0525_step44_hf/",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 5120,
+  "initializer_range": 0.02,
+  "intermediate_size": 13824,
+  "max_position_embeddings": 2048,
+  "model_type": "llama",
+  "num_attention_heads": 40,
+  "num_hidden_layers": 40,
+  "pad_token_id": 0,
+  "rms_norm_eps": 1e-06,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float16",
+  "transformers_version": "4.29.0.dev0",
+  "use_cache": true,
+  "vocab_size": 39424
+}
--- a/configuration.json
+++ b/configuration.json
@@ -0,0 +1,11 @@
+{
+    "framework": "pytorch",
+    "task": "text-generation",
+    "model": {
+        "type": "Ziya-LLaMA-13B-v1"
+    },
+    "pipeline": {
+        "type": "Ziya-LLaMA-13B-v1-text-generation-pipe"
+    },
+    "allow_remote": true
+}
--- a/generation_config.json
+++ b/generation_config.json
@@ -0,0 +1,7 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "pad_token_id": 0,
+  "transformers_version": "4.29.0.dev0"
+}
--- a/ms_wrapper.py
+++ b/ms_wrapper.py
@@ -0,0 +1,67 @@
+import os
+from typing import Union, Dict, Any
+from modelscope.pipelines.builder import PIPELINES
+from modelscope.models.builder import MODELS
+from modelscope.utils.constant import Tasks
+from modelscope.pipelines.base import Pipeline
+from modelscope.models.base import Model, TorchModel
+from modelscope.utils.logger import get_logger
+from transformers import AutoModelForCausalLM, AutoTokenizer
+from transformers import LlamaForCausalLM
+
+if 'CUDA_VISIBLE_DEVICES' not in os.environ:
+    os.environ['CUDA_VISIBLE_DEVICES'] = '0'
+
+
+
+@PIPELINES.register_module(Tasks.text_generation, module_name='Ziya-LLaMA-13B-v1-text-generation-pipe')
+class ZiyaLLaMA13Bv1TextGenerationPipeline(Pipeline):
+    def __init__(
+            self,
+            model: Union[Model, str],
+            *args,
+            **kwargs):
+        model = ZiyaLLaMA13Bv1TextGeneration(model) if isinstance(model, str) else model
+        super().__init__(model=model, **kwargs)
+    
+    def preprocess(self, inputs, **preprocess_params) -> Dict[str, Any]:
+        return inputs
+    
+    # define the forward pass
+    def forward(self, inputs: Dict, **forward_params) -> Dict[str, Any]:
+        return self.model(inputs)
+    
+    # format the outputs from pipeline
+    def postprocess(self, input, **kwargs) -> Dict[str, Any]:
+        return input
+
+
+
+@MODELS.register_module(Tasks.text_generation, module_name='Ziya-LLaMA-13B-v1')
+class ZiyaLLaMA13Bv1TextGeneration(TorchModel):
+    def __init__(self, model_dir=None, *args, **kwargs):
+        super().__init__(model_dir, *args, **kwargs)
+        self.logger = get_logger()
+        # loading tokenizer
+        self.tokenizer = AutoTokenizer.from_pretrained(model_dir)
+        self.model = LlamaForCausalLM.from_pretrained(model_dir, device_map="auto")
+        self.model = self.model.eval()
+    
+    def forward(self,input: Dict) -> Dict[str, Any]:
+        output = {}
+        res = self.infer(input)
+        output['text'] = res
+        return output
+    
+    def quantize(self, bits: int):
+        self.model = self.model.quantize(bits)
+        return self
+    
+    def infer(self, input):
+        device = self.model.device
+        input_ids = self.tokenizer(input, return_tensors="pt").input_ids.to(device)
+        logits = self.model.generate(input_ids, max_new_tokens=1024, do_sample = True, 
+                                     top_p = 0.85, temperature = 1.0, repetition_penalty=1.,
+                                     eos_token_id=2,bos_token_id=1,pad_token_id=0)
+        out = self.tokenizer.batch_decode(logits)[0]
+        return out
--- a/pk.png
+++ b/pk.png
--- a/pytorch_model-00001-of-00028.bin
+++ b/pytorch_model-00001-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e38683c5ea691cb0ae75bd15c5f3f059b5af559084569f53b7650c334dbba5f2
+size 896534991
--- a/pytorch_model-00002-of-00028.bin
+++ b/pytorch_model-00002-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b340ee8c36cf345ec05313eb538656945798c81aa7455fb543816d136c20753d
+size 985707823
--- a/pytorch_model-00003-of-00028.bin
+++ b/pytorch_model-00003-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:766dfaf59c5131b868148f24a4c809ed6e115950e54b99067cda83b4b6455ad1
+size 917528001
--- a/pytorch_model-00004-of-00028.bin
+++ b/pytorch_model-00004-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3dae93f62b033700fee2dc87c49d2d7e62cc28dc037d73a369f88b9b65ecc6b
+size 985707823
--- a/pytorch_model-00005-of-00028.bin
+++ b/pytorch_model-00005-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ba69524024bdff7da885fd7a03fac6f155393f49f158ffee2c1c107423eb71b
+size 917528001
--- a/pytorch_model-00006-of-00028.bin
+++ b/pytorch_model-00006-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:04e189dfc68405bb9f3db09f3eab7625b5e910aff95d099e81d7945dce2ecded
+size 985707823
--- a/pytorch_model-00007-of-00028.bin
+++ b/pytorch_model-00007-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:324e3511699012c539ef6147542e7dc02e6d0299bad720dae4b6d356aa4e3607
+size 917528001
--- a/pytorch_model-00008-of-00028.bin
+++ b/pytorch_model-00008-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8bc63c615d088a118f94150b92cf0bd9c05ebce6db9b268703b9a0d883c1172c
+size 985707823
--- a/pytorch_model-00009-of-00028.bin
+++ b/pytorch_model-00009-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0321aa53ca25f671730d430e467a838d9e0bf7750d32e5b41e9c272ab7aeddaf
+size 917528001
--- a/pytorch_model-00010-of-00028.bin
+++ b/pytorch_model-00010-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af43d0f5fba3fb49587b139077d8de090dd45031cc82a4d8734d28f5d7e1cd39
+size 985707823
--- a/pytorch_model-00011-of-00028.bin
+++ b/pytorch_model-00011-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:876126243e1bbd4bcd70805374b3e312fe6e7a1663b67d85175ee510193e717b
+size 917528001
--- a/pytorch_model-00012-of-00028.bin
+++ b/pytorch_model-00012-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a61eff9376f5957c5fe42ea4a50884589f0c2b7571c184ebd862c964b65b370e
+size 985707823
--- a/pytorch_model-00013-of-00028.bin
+++ b/pytorch_model-00013-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e791930766b21f12ae62c698d9cf4cc70e80d0cb75e0e43236b04970317909c4
+size 917528001
--- a/pytorch_model-00014-of-00028.bin
+++ b/pytorch_model-00014-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef188d54af85e3a64583033c6e46d9d8da988da0ec1a439bb5e4e93f98fcbec5
+size 985707823
--- a/pytorch_model-00015-of-00028.bin
+++ b/pytorch_model-00015-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5873cfb977b925c00cbd36f5ab23fc97c3c2001e3b3edd050550de7ea69b4d17
+size 917528001
--- a/pytorch_model-00016-of-00028.bin
+++ b/pytorch_model-00016-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:89221e84bf635fa868df498ddc2deabaee6f355bbe198cc56b7985a2c9dc8e65
+size 985707823
--- a/pytorch_model-00017-of-00028.bin
+++ b/pytorch_model-00017-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:007cb822dce729d63b378e55831bcd7d63c34cdfbc9ea73ec4162a89a77e50c6
+size 917528001
--- a/pytorch_model-00018-of-00028.bin
+++ b/pytorch_model-00018-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0deb620e5b18bf2a4ed73010877dc4b6400bbf4c214a8fbe0be5ea0b85067eb2
+size 985707823
--- a/pytorch_model-00019-of-00028.bin
+++ b/pytorch_model-00019-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be386fe1cb540d304a3c3c593fdd71952da98e6e539294f30acf7c02166287d8
+size 917528001
--- a/pytorch_model-00020-of-00028.bin
+++ b/pytorch_model-00020-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7df2b424a382a241ebd68b901db3795ad869501fbf8a21855918455104abebc
+size 985707823
--- a/pytorch_model-00021-of-00028.bin
+++ b/pytorch_model-00021-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2a929861d68ca3924a326e32f97f0b42cafd3b59ffddca4d8eb864da1f504205
+size 917528001
--- a/pytorch_model-00022-of-00028.bin
+++ b/pytorch_model-00022-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:43cc16d8db3d1f5ab9efb615e4afe7427d656948a3b04c59cce2527c0f3dd5a8
+size 985707823
--- a/pytorch_model-00023-of-00028.bin
+++ b/pytorch_model-00023-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:73cf6e8aeee34899d2e962fc6433ba08174220303fd92cd51980f1affcfd8883
+size 917528001
--- a/pytorch_model-00024-of-00028.bin
+++ b/pytorch_model-00024-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d5070b88d0c6b467f36e4060eaf8ccf36eee269d489813a7e3f3c4df3a2e556
+size 985707823
--- a/pytorch_model-00025-of-00028.bin
+++ b/pytorch_model-00025-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fa00813562f79aa9bb5ad0a0d04f2a8ad7409d298180568432ec4a4da2a7d768
+size 917528001
--- a/pytorch_model-00026-of-00028.bin
+++ b/pytorch_model-00026-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:062d05043f5923592e56c642417702bcd99082960bba3b24dbc8b1d2c947b970
+size 985707823
--- a/pytorch_model-00027-of-00028.bin
+++ b/pytorch_model-00027-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:434f427c34596366b531a4438e71123c401b18421d3a4d0444468484f4b5763e
+size 917528001
--- a/pytorch_model-00028-of-00028.bin
+++ b/pytorch_model-00028-of-00028.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:569b67b362ddb717b858d336b592ecd6136228950a824050a2d61e17180829fd
+size 545291867
--- a/pytorch_model.bin.index.json
+++ b/pytorch_model.bin.index.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd2aeaa1baf2bcc094dfe61143c5f49147d8ba1cba70d1182d9f4bd732caf86c
+size 33444
--- a/special_tokens_map.json
+++ b/special_tokens_map.json
@@ -0,0 +1,27 @@
+{
+  "additional_special_tokens": [
+    "<human>",
+    "<bot>"
+  ],
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}
--- a/tokenizer.model
+++ b/tokenizer.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6fd7e445833dd0889206aba242c2a51ecbae2437fd328d1759a35475fd8c0423
+size 588619
--- a/tokenizer_config.json
+++ b/tokenizer_config.json
@@ -0,0 +1,33 @@
+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "clean_up_tokenization_spaces": false,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": null,
+  "sp_model_kwargs": {},
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}