From c6fca6439bea90138a3864bb6fcaa93244f902d6 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 5 Jun 2026 22:18:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/QiMing-Holos-Plus-8B-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++ QiMing-Holos-Plus-8B.i1-IQ1_M.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ1_S.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ2_M.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ2_S.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ2_XS.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ2_XXS.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ3_M.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ3_S.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ3_XS.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ3_XXS.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ4_NL.gguf | 3 + QiMing-Holos-Plus-8B.i1-IQ4_XS.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q2_K.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q2_K_S.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q3_K_L.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q3_K_M.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q3_K_S.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q4_0.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q4_1.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q4_K_M.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q4_K_S.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q5_K_M.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q5_K_S.gguf | 3 + QiMing-Holos-Plus-8B.i1-Q6_K.gguf | 3 + QiMing-Holos-Plus-8B.imatrix.gguf | 3 + README.md | 98 ++++++++++++++++++++++++++++ 27 files changed, 233 insertions(+) create mode 100644 .gitattributes create mode 100644 QiMing-Holos-Plus-8B.i1-IQ1_M.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ1_S.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ2_M.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ2_S.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ2_XS.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ2_XXS.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ3_M.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ3_S.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ3_XS.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ3_XXS.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ4_NL.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-IQ4_XS.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q2_K.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q2_K_S.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q3_K_L.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q3_K_M.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q3_K_S.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q4_0.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q4_1.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q4_K_M.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q4_K_S.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q5_K_M.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q5_K_S.gguf create mode 100644 QiMing-Holos-Plus-8B.i1-Q6_K.gguf create mode 100644 QiMing-Holos-Plus-8B.imatrix.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..5f9987b --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.imatrix.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +QiMing-Holos-Plus-8B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/QiMing-Holos-Plus-8B.i1-IQ1_M.gguf b/QiMing-Holos-Plus-8B.i1-IQ1_M.gguf new file mode 100644 index 0000000..2cbcdab --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bbfdfc6cfeb4e523ca70a2348582776cf750536fea2d7db922151b8376fdd2b +size 2161975072 diff --git a/QiMing-Holos-Plus-8B.i1-IQ1_S.gguf b/QiMing-Holos-Plus-8B.i1-IQ1_S.gguf new file mode 100644 index 0000000..c0b6ca4 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea5734b032f9c64413946b2427ddc58344808b7d191bbba6f20d0ef05d90105 +size 2019630880 diff --git a/QiMing-Holos-Plus-8B.i1-IQ2_M.gguf b/QiMing-Holos-Plus-8B.i1-IQ2_M.gguf new file mode 100644 index 0000000..eb57439 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aede37897c9a56a9004c0d61cd5a43a342d6383abf772f8780ef536283280343 +size 2948284192 diff --git a/QiMing-Holos-Plus-8B.i1-IQ2_S.gguf b/QiMing-Holos-Plus-8B.i1-IQ2_S.gguf new file mode 100644 index 0000000..c0489b7 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96e16cef31118fa1691a269a61823c4a57e863ff8b2e0ebf64bb44ccc46fbe17 +size 2758491936 diff --git a/QiMing-Holos-Plus-8B.i1-IQ2_XS.gguf b/QiMing-Holos-Plus-8B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..224e28f --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954ebd74c068025e4eecb800352c323d15500baf391bde12e3572aa7d372d914 +size 2605784864 diff --git a/QiMing-Holos-Plus-8B.i1-IQ2_XXS.gguf b/QiMing-Holos-Plus-8B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..0224c97 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cdb8cf2e35287765384a16f487041316aafafe7fc04074191407841889b542f +size 2399215392 diff --git a/QiMing-Holos-Plus-8B.i1-IQ3_M.gguf b/QiMing-Holos-Plus-8B.i1-IQ3_M.gguf new file mode 100644 index 0000000..a9247a1 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7384f1492aaf3606dbe4e6f0d7c90c64ea96bf98d9217093e30478f2f4da10 +size 3784826656 diff --git a/QiMing-Holos-Plus-8B.i1-IQ3_S.gguf b/QiMing-Holos-Plus-8B.i1-IQ3_S.gguf new file mode 100644 index 0000000..0db347d --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f841d8a44e9e22ada05319fe15370d62a7ece41a807147fb9c90cd625a0a717b +size 3682328352 diff --git a/QiMing-Holos-Plus-8B.i1-IQ3_XS.gguf b/QiMing-Holos-Plus-8B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..0ac59b1 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b36638ca3dce4bda3f6e4a6519ea09af7949efc779c9f962cb69dfbdfb10e30 +size 3518750496 diff --git a/QiMing-Holos-Plus-8B.i1-IQ3_XXS.gguf b/QiMing-Holos-Plus-8B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..b2ec97c --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08b935375d5a50be5e09620c4bbc100e72d5a645a2dac4ec6e5c8ea42040174a +size 3274915616 diff --git a/QiMing-Holos-Plus-8B.i1-IQ4_NL.gguf b/QiMing-Holos-Plus-8B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..4483cd4 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b75d592dfadc288e3b02c9db5be545e1a32b44cd2c395aa2781dfed014f9425 +size 4677992224 diff --git a/QiMing-Holos-Plus-8B.i1-IQ4_XS.gguf b/QiMing-Holos-Plus-8B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..0c425a8 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f32277ca301b65a3b0a716b00553d1d5a905ae2062e8c65e7f65db668d64eb +size 4447665952 diff --git a/QiMing-Holos-Plus-8B.i1-Q2_K.gguf b/QiMing-Holos-Plus-8B.i1-Q2_K.gguf new file mode 100644 index 0000000..58c9653 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f7766e47be76495410ed4c1650238c4029e8fac74c03433f19424b93c99b20f +size 3179134752 diff --git a/QiMing-Holos-Plus-8B.i1-Q2_K_S.gguf b/QiMing-Holos-Plus-8B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..57ffffe --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70a2ed06834b111898169726a012900f538340dda247caeb347180f901451f1 +size 2988818208 diff --git a/QiMing-Holos-Plus-8B.i1-Q3_K_L.gguf b/QiMing-Holos-Plus-8B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..e056633 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d5d804a56ea2753b7fe97f38919d88d67bd71e19d60558bfbfc3ca707c1f98 +size 4321959712 diff --git a/QiMing-Holos-Plus-8B.i1-Q3_K_M.gguf b/QiMing-Holos-Plus-8B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..d584b6b --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c539ff00ed2973a5e92ac70c0ecc8f8d4ff67bb680ab92e3d5de13b2672bbc2 +size 4018921248 diff --git a/QiMing-Holos-Plus-8B.i1-Q3_K_S.gguf b/QiMing-Holos-Plus-8B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..7b68131 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e74970dd115c1d4e9534876ce55acbf71cd7fb7f79baf310a558a382477f9c +size 3664502560 diff --git a/QiMing-Holos-Plus-8B.i1-Q4_0.gguf b/QiMing-Holos-Plus-8B.i1-Q4_0.gguf new file mode 100644 index 0000000..fcec020 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f806fd0f5bf269707e3347d4c7d78861c849f417856891417f7ff28bcef1aa71 +size 4675895072 diff --git a/QiMing-Holos-Plus-8B.i1-Q4_1.gguf b/QiMing-Holos-Plus-8B.i1-Q4_1.gguf new file mode 100644 index 0000000..210b433 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3781c9725adb71486fada472ea368a66bb8aa2799ce03bbee06333e825421699 +size 5130256160 diff --git a/QiMing-Holos-Plus-8B.i1-Q4_K_M.gguf b/QiMing-Holos-Plus-8B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..3167c5d --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3f98508e4f590a363d262e56a8a60c1e2ec3883d7f357c8707d7d47e1915f1 +size 4920737568 diff --git a/QiMing-Holos-Plus-8B.i1-Q4_K_S.gguf b/QiMing-Holos-Plus-8B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..2a08a74 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:578d7436ae64b8384848b9a61b67e7740d14a21718be1a11707cb01d9594d467 +size 4692672288 diff --git a/QiMing-Holos-Plus-8B.i1-Q5_K_M.gguf b/QiMing-Holos-Plus-8B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..c983124 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1753ddd7e60675e5ccc72a27610418fe7ce8671eb0d12aebc0661806502483ab +size 5732990752 diff --git a/QiMing-Holos-Plus-8B.i1-Q5_K_S.gguf b/QiMing-Holos-Plus-8B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..9d5f27f --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:208901b2bc9a55705752a6571dfc6bd1eda56c08006ddf97fe088bd353db956a +size 5599297312 diff --git a/QiMing-Holos-Plus-8B.i1-Q6_K.gguf b/QiMing-Holos-Plus-8B.i1-Q6_K.gguf new file mode 100644 index 0000000..91bb793 --- /dev/null +++ b/QiMing-Holos-Plus-8B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d3be7972997873f364d12c5a4022352d0ab478c0fa5edf43edd8c4b503b0bb +size 6596009760 diff --git a/QiMing-Holos-Plus-8B.imatrix.gguf b/QiMing-Holos-Plus-8B.imatrix.gguf new file mode 100644 index 0000000..dea4c05 --- /dev/null +++ b/QiMing-Holos-Plus-8B.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a1f8343aa970dcdc00bc96b3c1b8c6809193b0e47e706b0943861eb5f94c30 +size 5015200 diff --git a/README.md b/README.md new file mode 100644 index 0000000..3a9deaf --- /dev/null +++ b/README.md @@ -0,0 +1,98 @@ +--- +base_model: aifeifei798/QiMing-Holos-Plus-8B +language: +- zh +- en +library_name: transformers +license: llama3.1 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- llama +- unsloth +- qiming +- qiming-holos +- bagua +- decision-making +- strategic-analysis +- cognitive-architecture +- chat +- lora +- philosophy-driven-ai +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/aifeifei798/QiMing-Holos-Plus-8B + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#QiMing-Holos-Plus-8B-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ1_S.gguf) | i1-IQ1_S | 2.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ1_M.gguf) | i1-IQ1_M | 2.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ2_S.gguf) | i1-IQ2_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ2_M.gguf) | i1-IQ2_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 3.1 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q2_K.gguf) | i1-Q2_K | 3.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.8 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ3_S.gguf) | i1-IQ3_S | 3.8 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ3_M.gguf) | i1-IQ3_M | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 4.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.5 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q4_0.gguf) | i1-Q4_0 | 4.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 4.8 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 5.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q4_1.gguf) | i1-Q4_1 | 5.2 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/QiMing-Holos-Plus-8B-i1-GGUF/resolve/main/QiMing-Holos-Plus-8B.i1-Q6_K.gguf) | i1-Q6_K | 6.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +