初始化项目,由ModelHub XC社区提供模型
Model: QuantFactory/LongWriter-llama3.1-8b-GGUF Source: Original Platform
This commit is contained in:
49
.gitattributes
vendored
Normal file
49
.gitattributes
vendored
Normal file
@@ -0,0 +1,49 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
LongWriter-llama3.1-8b.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
3
LongWriter-llama3.1-8b.Q2_K.gguf
Normal file
3
LongWriter-llama3.1-8b.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8e654df5fd98fadab1ab01a614de783f311d71b8b32a1bd4e9963b3e30eb1fa2
|
||||
size 3179131424
|
||||
3
LongWriter-llama3.1-8b.Q3_K_L.gguf
Normal file
3
LongWriter-llama3.1-8b.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:d1cb1e6ce1360adc90e4c9956e9421ee561458b2bbd7a107a484a008390e928c
|
||||
size 4321956384
|
||||
3
LongWriter-llama3.1-8b.Q3_K_M.gguf
Normal file
3
LongWriter-llama3.1-8b.Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:2542e3806b0069523deedea36cb090566b490ff4cfd9dc59e7e538a524ed67e9
|
||||
size 4018917920
|
||||
3
LongWriter-llama3.1-8b.Q3_K_S.gguf
Normal file
3
LongWriter-llama3.1-8b.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:00ec0ed2f00fd534362607a98ce159d21dd2622c4ab41d28b9a37780019d5000
|
||||
size 3664499232
|
||||
3
LongWriter-llama3.1-8b.Q4_0.gguf
Normal file
3
LongWriter-llama3.1-8b.Q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c92061b9d2a2e4f98391dc415de95a38d26007d88830389236ddd9f8b3281899
|
||||
size 4661211680
|
||||
3
LongWriter-llama3.1-8b.Q4_1.gguf
Normal file
3
LongWriter-llama3.1-8b.Q4_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1ed1e8007557285fafde24255f96e009c5b6463a4f66361d20f62a8f9d3f25b4
|
||||
size 5130252832
|
||||
3
LongWriter-llama3.1-8b.Q4_K_M.gguf
Normal file
3
LongWriter-llama3.1-8b.Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:2c70ec463165f414c62689dce52ca2cfc788c501d16917dc5e08dafea4d91dbf
|
||||
size 4920734240
|
||||
3
LongWriter-llama3.1-8b.Q4_K_S.gguf
Normal file
3
LongWriter-llama3.1-8b.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:718f988d8d721e2d6223d8814a154773286344093842f2a86abf421aede80db1
|
||||
size 4692668960
|
||||
3
LongWriter-llama3.1-8b.Q5_0.gguf
Normal file
3
LongWriter-llama3.1-8b.Q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:f79aa7ed50946a0d7a16d3117947699e1e23622a272c2d546f5c6c19eee70228
|
||||
size 5599293984
|
||||
3
LongWriter-llama3.1-8b.Q5_1.gguf
Normal file
3
LongWriter-llama3.1-8b.Q5_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:3e7eebc8e74ec71e7c189281f668b9d872a2e62a15b698fe6e67dd931fbeca06
|
||||
size 6068335136
|
||||
3
LongWriter-llama3.1-8b.Q5_K_M.gguf
Normal file
3
LongWriter-llama3.1-8b.Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:d206872c19207b974d7826c076bbea22f8c25cc16c08ad77953d45624704c49c
|
||||
size 5732987424
|
||||
3
LongWriter-llama3.1-8b.Q5_K_S.gguf
Normal file
3
LongWriter-llama3.1-8b.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:837a6ec6056c1706f75a759749bdf11e52c73a31abb06d5d96b6b7c247088fe3
|
||||
size 5599293984
|
||||
3
LongWriter-llama3.1-8b.Q6_K.gguf
Normal file
3
LongWriter-llama3.1-8b.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:805cbb51ca02a0c6d44ac97924ee5b0bebbb7f742dbd345178b42a1b575d058a
|
||||
size 6596006432
|
||||
3
LongWriter-llama3.1-8b.Q8_0.gguf
Normal file
3
LongWriter-llama3.1-8b.Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:98b0f8e426e94137bff7c371d5a09f6d65e74cceb4088301264c2758ca6b3211
|
||||
size 8540770848
|
||||
70
README.md
Normal file
70
README.md
Normal file
@@ -0,0 +1,70 @@
|
||||
|
||||
---
|
||||
|
||||
language:
|
||||
- en
|
||||
- zh
|
||||
library_name: transformers
|
||||
tags:
|
||||
- Long Context
|
||||
- chatglm
|
||||
- llama
|
||||
datasets:
|
||||
- THUDM/LongWriter-6k
|
||||
license: llama3.1
|
||||
|
||||
---
|
||||
|
||||

|
||||
|
||||
# QuantFactory/LongWriter-llama3.1-8b-GGUF
|
||||
This is a quantized version of [THUDM/LongWriter-llama3.1-8b](https://huggingface.co/THUDM/LongWriter-llama3.1-8b) created using llama.cpp.
|
||||
|
||||
# Original Model Card
|
||||
|
||||
# LongWriter-llama3.1-8b
|
||||
|
||||
<p align="center">
|
||||
🤗 <a href="https://huggingface.co/datasets/THUDM/LongWriter-6k" target="_blank">[LongWriter Dataset] </a> • 💻 <a href="https://github.com/THUDM/LongWriter" target="_blank">[Github Repo]</a> • 📃 <a href="https://arxiv.org/abs/2408.07055" target="_blank">[LongWriter Paper]</a>
|
||||
</p>
|
||||
|
||||
LongWriter-llama3.1-8b is trained based on [Meta-Llama-3.1-8B](https://huggingface.co/meta-llama/Meta-Llama-3.1-8B), and is capable of generating 10,000+ words at once.
|
||||
|
||||
|
||||
A simple demo for deployment of the model:
|
||||
```python
|
||||
from transformers import AutoTokenizer, AutoModelForCausalLM
|
||||
import torch
|
||||
tokenizer = AutoTokenizer.from_pretrained("THUDM/LongWriter-llama3.1-8b", trust_remote_code=True)
|
||||
model = AutoModelForCausalLM.from_pretrained("THUDM/LongWriter-llama3.1-8b", torch_dtype=torch.bfloat16, trust_remote_code=True, device_map="auto")
|
||||
model = model.eval()
|
||||
query = "Write a 10000-word China travel guide"
|
||||
prompt = f"[INST]{query}[/INST]"
|
||||
input = tokenizer(prompt, truncation=False, return_tensors="pt").to(model.device)
|
||||
context_length = input.input_ids.shape[-1]
|
||||
output = model.generate(
|
||||
**input,
|
||||
max_new_tokens=32768,
|
||||
num_beams=1,
|
||||
do_sample=True,
|
||||
temperature=0.5,
|
||||
)[0]
|
||||
response = tokenizer.decode(output[context_length:], skip_special_tokens=True)
|
||||
print(response)
|
||||
```
|
||||
Please adhere to the prompt template (system prompt is optional): `<<SYS>>\n{system prompt}\n<</SYS>>\n\n[INST]{query1}[/INST]{response1}[INST]{query2}[/INST]{response2}...`
|
||||
|
||||
License: [Llama-3.1 License](https://huggingface.co/meta-llama/Meta-Llama-3.1-8B/blob/main/LICENSE)
|
||||
|
||||
## Citation
|
||||
|
||||
If you find our work useful, please consider citing LongWriter:
|
||||
|
||||
```
|
||||
@article{bai2024longwriter,
|
||||
title={LongWriter: Unleashing 10,000+ Word Generation from Long Context LLMs},
|
||||
author={Yushi Bai and Jiajie Zhang and Xin Lv and Linzhi Zheng and Siqi Zhu and Lei Hou and Yuxiao Dong and Jie Tang and Juanzi Li},
|
||||
journal={arXiv preprint arXiv:2408.07055},
|
||||
year={2024}
|
||||
}
|
||||
```
|
||||
1
configuration.json
Normal file
1
configuration.json
Normal file
@@ -0,0 +1 @@
|
||||
{}
|
||||
Reference in New Issue
Block a user