From 80e9c175f61e2fb7876356d86494d0c85946a9fb Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 16 May 2026 01:02:38 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: shaowenchen/longchat-13b-16k-gguf Source: Original Platform --- .gitattributes | 36 ++++++++++++++++++++ README.md | 64 ++++++++++++++++++++++++++++++++++++ configuration.json | 10 ++++++ longchat-13b-16k.Q2_K.gguf | 3 ++ longchat-13b-16k.Q3_K.gguf | 3 ++ longchat-13b-16k.Q3_K_L.gguf | 3 ++ longchat-13b-16k.Q3_K_S.gguf | 3 ++ longchat-13b-16k.Q4_0.gguf | 3 ++ longchat-13b-16k.Q4_1.gguf | 3 ++ longchat-13b-16k.Q4_K.gguf | 3 ++ longchat-13b-16k.Q4_K_S.gguf | 3 ++ longchat-13b-16k.Q5_0.gguf | 3 ++ longchat-13b-16k.Q5_1.gguf | 3 ++ longchat-13b-16k.Q5_K.gguf | 3 ++ longchat-13b-16k.Q5_K_S.gguf | 3 ++ longchat-13b-16k.Q6_K.gguf | 3 ++ longchat-13b-16k.Q8_0.gguf | 3 ++ longchat-13b-16k.gguf | 3 ++ 18 files changed, 155 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 configuration.json create mode 100644 longchat-13b-16k.Q2_K.gguf create mode 100644 longchat-13b-16k.Q3_K.gguf create mode 100644 longchat-13b-16k.Q3_K_L.gguf create mode 100644 longchat-13b-16k.Q3_K_S.gguf create mode 100644 longchat-13b-16k.Q4_0.gguf create mode 100644 longchat-13b-16k.Q4_1.gguf create mode 100644 longchat-13b-16k.Q4_K.gguf create mode 100644 longchat-13b-16k.Q4_K_S.gguf create mode 100644 longchat-13b-16k.Q5_0.gguf create mode 100644 longchat-13b-16k.Q5_1.gguf create mode 100644 longchat-13b-16k.Q5_K.gguf create mode 100644 longchat-13b-16k.Q5_K_S.gguf create mode 100644 longchat-13b-16k.Q6_K.gguf create mode 100644 longchat-13b-16k.Q8_0.gguf create mode 100644 longchat-13b-16k.gguf diff --git a/.gitattributes b/.gitattributes new file mode 
100644 index 0000000..e79ce6a --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +*.gguf filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..ca8c196 --- /dev/null +++ b/README.md @@ -0,0 +1,64 @@ +--- +inference: true +language: + - zh + - en +license: other +model_creator: lmsys +model_link: https://huggingface.co/lmsys/longchat-13b-16k +model_name: 
longchat-13b-16k +model_type: longchat +pipeline_tag: text-generation +quantized_by: shaowenchen +tasks: + - text2text-generation +tags: + - gguf + - longchat + - 13b + - 16k +--- + +## Provided files + +| Name | Quant method | Size | +| ---------------------------- | ------------ | ------ | +| longchat-13b-16k.Q2_K.gguf | Q2_K | 5.1 GB | +| longchat-13b-16k.Q3_K.gguf | Q3_K | 5.9 GB | +| longchat-13b-16k.Q3_K_L.gguf | Q3_K_L | 6.5 GB | +| longchat-13b-16k.Q3_K_S.gguf | Q3_K_S | 5.3 GB | +| longchat-13b-16k.Q4_0.gguf | Q4_0 | 6.9 GB | +| longchat-13b-16k.Q4_1.gguf | Q4_1 | 7.6 GB | +| longchat-13b-16k.Q4_K.gguf | Q4_K | 7.3 GB | +| longchat-13b-16k.Q4_K_S.gguf | Q4_K_S | 6.9 GB | +| longchat-13b-16k.Q5_0.gguf | Q5_0 | 8.4 GB | +| longchat-13b-16k.Q5_1.gguf | Q5_1 | 9.1 GB | +| longchat-13b-16k.Q5_K.gguf | Q5_K | 8.6 GB | +| longchat-13b-16k.Q5_K_S.gguf | Q5_K_S | 8.4 GB | +| longchat-13b-16k.Q6_K.gguf | Q6_K | 9.9 GB | +| longchat-13b-16k.Q8_0.gguf | Q8_0 | 13 GB | +| longchat-13b-16k.gguf | full | 24 GB | + +Usage: + +``` +docker run --rm -it -p 8000:8000 -v /path/to/models:/models -e MODEL=/models/gguf-model-name.gguf hubimage/llama-cpp-python:latest +``` + +Then open http://localhost:8000/docs to view the Swagger UI. + +## Provided images + +| Name | Quant method | Compressed Size | +| ---------------------------------------- | ------------ | --------------- | +| `shaowenchen/longchat-13b-16k-gguf:Q2_K` | Q2_K | 7.47 GB | +| `shaowenchen/longchat-13b-16k-gguf:Q3_K` | Q3_K | 6.11 GB | +| `shaowenchen/longchat-13b-16k-gguf:Q4_K` | Q4_K | 5.29 GB | + +Usage: + +``` +docker run --rm -p 8000:8000 shaowenchen/longchat-13b-16k-gguf:Q2_K +``` + +Then open http://localhost:8000/docs to view the Swagger UI. 
diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..86b0b11 --- /dev/null +++ b/configuration.json @@ -0,0 +1,10 @@ +{ + "framework": "pytorch", + "task": "text-generation", + "model": { + "type": "longchat" + }, + "pipeline": { + "type": "longchat-13b-16k-text-generation-pipe" + } +} \ No newline at end of file diff --git a/longchat-13b-16k.Q2_K.gguf b/longchat-13b-16k.Q2_K.gguf new file mode 100644 index 0000000..d3a6abf --- /dev/null +++ b/longchat-13b-16k.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3779d4febe1fd4e5121f5430529d6169537a9dee1596d2dcae34e5e5a3427c96 +size 5429348256 diff --git a/longchat-13b-16k.Q3_K.gguf b/longchat-13b-16k.Q3_K.gguf new file mode 100644 index 0000000..43cdc10 --- /dev/null +++ b/longchat-13b-16k.Q3_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee53e00448d89752aa49148bd57b858eff261ed434118ca7727ca51a68a773e7 +size 6337769376 diff --git a/longchat-13b-16k.Q3_K_L.gguf b/longchat-13b-16k.Q3_K_L.gguf new file mode 100644 index 0000000..f9b7bec --- /dev/null +++ b/longchat-13b-16k.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a08d751fea3204d5c6cfecd723044f2075a8744614f4d16135006417b433d4 +size 6929559456 diff --git a/longchat-13b-16k.Q3_K_S.gguf b/longchat-13b-16k.Q3_K_S.gguf new file mode 100644 index 0000000..88f1d80 --- /dev/null +++ b/longchat-13b-16k.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4b48f519062148ace72931413ee42718ff0e68a582091158607459a6cc77fb +size 5658980256 diff --git a/longchat-13b-16k.Q4_0.gguf b/longchat-13b-16k.Q4_0.gguf new file mode 100644 index 0000000..6496459 --- /dev/null +++ b/longchat-13b-16k.Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:962582bdae575684c7582f4a09b56aea457d35311951a6d3b87d921857f39610 +size 7365834656 diff --git a/longchat-13b-16k.Q4_1.gguf 
b/longchat-13b-16k.Q4_1.gguf new file mode 100644 index 0000000..4ecb990 --- /dev/null +++ b/longchat-13b-16k.Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948ae04d504e19f404e5546700a6201b991c365a6d7f9d902338fc174ba52859 +size 8169060256 diff --git a/longchat-13b-16k.Q4_K.gguf b/longchat-13b-16k.Q4_K.gguf new file mode 100644 index 0000000..332ea90 --- /dev/null +++ b/longchat-13b-16k.Q4_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a24f1285c68523d46d7294f3195fb6822df6b7f711e91416b4efe7ed5edb168 +size 7865956256 diff --git a/longchat-13b-16k.Q4_K_S.gguf b/longchat-13b-16k.Q4_K_S.gguf new file mode 100644 index 0000000..785fe25 --- /dev/null +++ b/longchat-13b-16k.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c6f9abdf28a325cf6847defb2cf9a9f3861b1c543f2436bc88fdac8d3865f3 +size 7414331296 diff --git a/longchat-13b-16k.Q5_0.gguf b/longchat-13b-16k.Q5_0.gguf new file mode 100644 index 0000000..74157c7 --- /dev/null +++ b/longchat-13b-16k.Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75ed3167dba3650de6e674f93a5a7eb967deaff12876aaf4f2d714e614809114 +size 8972285856 diff --git a/longchat-13b-16k.Q5_1.gguf b/longchat-13b-16k.Q5_1.gguf new file mode 100644 index 0000000..4df6e40 --- /dev/null +++ b/longchat-13b-16k.Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:415b20beb5f892ae5693c60d860bf1ab0135fa8c7b13aeaa0e22b07d3d576b97 +size 9775511456 diff --git a/longchat-13b-16k.Q5_K.gguf b/longchat-13b-16k.Q5_K.gguf new file mode 100644 index 0000000..90d7841 --- /dev/null +++ b/longchat-13b-16k.Q5_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f08ddee15f174e6c4b6a23c3a7ea5b0b30cff96f589ae48e289b04575f9d3f +size 9229924256 diff --git a/longchat-13b-16k.Q5_K_S.gguf b/longchat-13b-16k.Q5_K_S.gguf new file mode 100644 index 0000000..2abf035 --- /dev/null +++ 
b/longchat-13b-16k.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3305af3855cd22764bb8e7762efc347d2c370441d9bcb2695fc219363def6eff +size 8972285856 diff --git a/longchat-13b-16k.Q6_K.gguf b/longchat-13b-16k.Q6_K.gguf new file mode 100644 index 0000000..79b7068 --- /dev/null +++ b/longchat-13b-16k.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8886457d379326cd9f0d2a061dcaba360ea7869a2ee78564985f004e28799c5d +size 10679140256 diff --git a/longchat-13b-16k.Q8_0.gguf b/longchat-13b-16k.Q8_0.gguf new file mode 100644 index 0000000..2bc9d37 --- /dev/null +++ b/longchat-13b-16k.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb66e400abdf588d08d16c259de526008b763311b11e8feb65b3d3d5e2ac1e5 +size 13831319456 diff --git a/longchat-13b-16k.gguf b/longchat-13b-16k.gguf new file mode 100644 index 0000000..bc305cb --- /dev/null +++ b/longchat-13b-16k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa1b6a5d9da12433aadc247d92d112319af8f12c4df6ad0b6f439a969ed8e3a +size 26033303424