commit a0699a27595f3cccf0bf49623d208d3f71ee6d3c Author: ModelHub XC Date: Fri Apr 10 10:52:56 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/XinYuan-Qwen2-7B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..e75dbcc --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q2_K.gguf filter=lfs diff=lfs 
merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +XinYuan-Qwen2-7B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..3623ce8 --- /dev/null +++ b/README.md @@ -0,0 +1,79 @@ +--- +base_model: thomas-yanxin/XinYuan-Qwen2-7B +datasets: +- thomas-yanxin/MT-SFT-ShareGPT +language: +- zh +- en +library_name: transformers +license: other +quantized_by: mradermacher +--- +## About + + + + + + +weighted/imatrix quants of 
https://huggingface.co/thomas-yanxin/XinYuan-Qwen2-7B + + +static quants are available at https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable to similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ1_S.gguf) | i1-IQ1_S | 2.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ1_M.gguf) | i1-IQ1_M | 2.1 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ2_S.gguf) | i1-IQ2_S | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ2_M.gguf) | i1-IQ2_M | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q2_K.gguf) | i1-Q2_K | 3.1 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.4 | | +| 
[GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ3_S.gguf) | i1-IQ3_S | 3.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ3_M.gguf) | i1-IQ3_M | 3.7 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.9 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 4.5 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 4.5 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 4.5 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q4_0.gguf) | i1-Q4_0 | 4.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.8 | fast, recommended | +| 
[GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.4 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.5 | | +| [GGUF](https://huggingface.co/mradermacher/XinYuan-Qwen2-7B-i1-GGUF/resolve/main/XinYuan-Qwen2-7B.i1-Q6_K.gguf) | i1-Q6_K | 6.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. 
+ + diff --git a/XinYuan-Qwen2-7B.i1-IQ1_M.gguf b/XinYuan-Qwen2-7B.i1-IQ1_M.gguf new file mode 100644 index 0000000..3da548c --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7c80f856c58240b8210d43e9b12da3c2b0d0fea9ae3aa5c447185a6fe6170e2 +size 2042194624 diff --git a/XinYuan-Qwen2-7B.i1-IQ1_S.gguf b/XinYuan-Qwen2-7B.i1-IQ1_S.gguf new file mode 100644 index 0000000..89f39ab --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db4bcb6d297c67b7adfb47bd10226b08487764993a2e701787498041dbf8370 +size 1903665856 diff --git a/XinYuan-Qwen2-7B.i1-IQ2_M.gguf b/XinYuan-Qwen2-7B.i1-IQ2_M.gguf new file mode 100644 index 0000000..760db95 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75994bc9a3ca2529cf54c96413dfcef95338b0efcfc1de6fdd5d79645cfec5a4 +size 2780340928 diff --git a/XinYuan-Qwen2-7B.i1-IQ2_S.gguf b/XinYuan-Qwen2-7B.i1-IQ2_S.gguf new file mode 100644 index 0000000..7861035 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b18423bbf52f0754d6353729a54e31ca873f3ec897682c232fc04d2141788ab2 +size 2595635904 diff --git a/XinYuan-Qwen2-7B.i1-IQ2_XS.gguf b/XinYuan-Qwen2-7B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..866d8ae --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039db86b4888b6b7c71f2ec285a212e256c5c84b3cb67ff8f9e2c26d09dc7941 +size 2469020352 diff --git a/XinYuan-Qwen2-7B.i1-IQ2_XXS.gguf b/XinYuan-Qwen2-7B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..32d790a --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1e8df94c937fdd37ea352fa9a56872b798631b63f4ee6e60dd423e5d04829de +size 2273075904 diff --git 
a/XinYuan-Qwen2-7B.i1-IQ3_M.gguf b/XinYuan-Qwen2-7B.i1-IQ3_M.gguf new file mode 100644 index 0000000..a8856b0 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f91cb4fdaf3432f11c85c5b7d9ba618b02d3572784c19627da4a2bbdadaaed2 +size 3574010560 diff --git a/XinYuan-Qwen2-7B.i1-IQ3_S.gguf b/XinYuan-Qwen2-7B.i1-IQ3_S.gguf new file mode 100644 index 0000000..bb62afe --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f57d5179f7cd6f20a86d9466e73019ac999f66330ec44ada397aa8ff03693d5 +size 3499190976 diff --git a/XinYuan-Qwen2-7B.i1-IQ3_XS.gguf b/XinYuan-Qwen2-7B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..1b37c4c --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2293531499e2d5caf4abd69ca16a772038b125827eced0112db483981eafd5 +size 3346254528 diff --git a/XinYuan-Qwen2-7B.i1-IQ3_XXS.gguf b/XinYuan-Qwen2-7B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..8ff0f86 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a94379e4b437da1668ee7728d3398ae8cb3e53d1c4f1ae82da0224d56c65b2 +size 3114513088 diff --git a/XinYuan-Qwen2-7B.i1-IQ4_XS.gguf b/XinYuan-Qwen2-7B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..147179a --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51797cab527b671f521402e8db7128eb988a36c25278762de6844268770c9a4b +size 4218471104 diff --git a/XinYuan-Qwen2-7B.i1-Q2_K.gguf b/XinYuan-Qwen2-7B.i1-Q2_K.gguf new file mode 100644 index 0000000..7e07b27 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30229bdcaffa34dc7ebecc7b5e8d4931cf6af0378f3a75fb3264aac521da2cfd +size 3015938752 diff --git a/XinYuan-Qwen2-7B.i1-Q3_K_L.gguf 
b/XinYuan-Qwen2-7B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..abc07fc --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2cd821410e8de5fbeff190a98e26256965e315332d6336fd46e8b8270b686f0 +size 4088457920 diff --git a/XinYuan-Qwen2-7B.i1-Q3_K_M.gguf b/XinYuan-Qwen2-7B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..e071437 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d758c2305b8b511605dac0252ecc63b40fbf98fdd0eae739d46cbaded5d58f +size 3808389824 diff --git a/XinYuan-Qwen2-7B.i1-Q3_K_S.gguf b/XinYuan-Qwen2-7B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..8b0aaa3 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4381bd9c679c7acaea2862a337543167f6e923250161c5c41babff0e7ab0b12f +size 3492367040 diff --git a/XinYuan-Qwen2-7B.i1-Q4_0.gguf b/XinYuan-Qwen2-7B.i1-Q4_0.gguf new file mode 100644 index 0000000..913184b --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b80d276378b4a4b590a866277f969bad82094007116ac260e225d1f4f3498da0 +size 4444119744 diff --git a/XinYuan-Qwen2-7B.i1-Q4_0_4_4.gguf b/XinYuan-Qwen2-7B.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..5874a0c --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1f78dffa1ad34a7995285eb3784f4f3f5e4db1d2431e09dc958ca49b448bca +size 4431389376 diff --git a/XinYuan-Qwen2-7B.i1-Q4_0_4_8.gguf b/XinYuan-Qwen2-7B.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..87aca1f --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0929b7659f18da349cd1b0326eebe7c6ce8b4dd4ef9b1f84b69c4889dda59dc +size 4431389376 diff --git a/XinYuan-Qwen2-7B.i1-Q4_0_8_8.gguf 
b/XinYuan-Qwen2-7B.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..063dc4f --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd9f9aa7d66f4b680f98b0d1707c7d225a8a88acb8dedc851c2db65c75c7c897 +size 4431389376 diff --git a/XinYuan-Qwen2-7B.i1-Q4_K_M.gguf b/XinYuan-Qwen2-7B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..e278963 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0cae8c11e7d63e579bde3475b12aa0913c4d84495234afd45be184d9b30e951 +size 4683072192 diff --git a/XinYuan-Qwen2-7B.i1-Q4_K_S.gguf b/XinYuan-Qwen2-7B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..207eaea --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479151336e839273eed208699a9018a5533fb98470462d284d99247e01516be9 +size 4457767616 diff --git a/XinYuan-Qwen2-7B.i1-Q5_K_M.gguf b/XinYuan-Qwen2-7B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..40dca8a --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6371c8c80cf830d28bbe9467bb02f49c4bb1fc148d64ea2867c3a8e75fcc1332 +size 5444829888 diff --git a/XinYuan-Qwen2-7B.i1-Q5_K_S.gguf b/XinYuan-Qwen2-7B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..a55f3dc --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a4dad30a63aafb58c89fe07b55829328aba782979b1504d71426505d225016 +size 5315175104 diff --git a/XinYuan-Qwen2-7B.i1-Q6_K.gguf b/XinYuan-Qwen2-7B.i1-Q6_K.gguf new file mode 100644 index 0000000..e7ef269 --- /dev/null +++ b/XinYuan-Qwen2-7B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99c88d98792141c1566a9cd9a8d0696f99c5c5d2165cb28ca710e8d121e4540 +size 6254197440 diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 
0000000..c86cbbe --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f379dc268c8815d2c9bd5a676e6c842227ee05ba026e8afed2015531ced60ed8 +size 4536665