commit eaee9e2cb8eb2c545d409d4f69709cf07595edb9 Author: ModelHub XC Date: Fri May 8 19:29:03 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: SimplySara/LocoOperator-4B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..d1606c4 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,64 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-MXFP4_MOE.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B-i1-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +LocoOperator-4B.imatrix.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/LocoOperator-4B-i1-IQ1_M.gguf b/LocoOperator-4B-i1-IQ1_M.gguf new file mode 100644 index 0000000..d46c0d6 --- /dev/null +++ b/LocoOperator-4B-i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97759ec33ae92b604f341ff72ab8e5ae9284d4a516858c960e783ac18d7374c7 +size 1127016576 diff --git a/LocoOperator-4B-i1-IQ1_S.gguf b/LocoOperator-4B-i1-IQ1_S.gguf new file mode 100644 index 0000000..d4b40f8 --- /dev/null +++ b/LocoOperator-4B-i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b561ebff73a239b1a99316242960fdbb2fe9e83d5c960f34c7088541a00cfd7 +size 1055254656 diff --git a/LocoOperator-4B-i1-IQ2_M.gguf b/LocoOperator-4B-i1-IQ2_M.gguf new file mode 100644 index 0000000..0f9ddcb --- /dev/null +++ b/LocoOperator-4B-i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f925768783361f8a5314439d00c0fbe314cebab82317d05aabb97e9409c325 +size 1512982656 diff --git a/LocoOperator-4B-i1-IQ2_S.gguf b/LocoOperator-4B-i1-IQ2_S.gguf new file mode 100644 index 0000000..8b0cef2 --- /dev/null +++ b/LocoOperator-4B-i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8d0dcd6fe59debb2c4a7e7eb0d888e601d7a9f32f0c416dd73a58d919a98ab +size 1417300096 diff --git a/LocoOperator-4B-i1-IQ2_XS.gguf b/LocoOperator-4B-i1-IQ2_XS.gguf new file mode 100644 index 0000000..7c1d43d --- /dev/null +++ b/LocoOperator-4B-i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e201a6719ef280aea8e5884aa93f6d31cd3357735177eee8feb36235de4e9c37 +size 1354098816 diff --git a/LocoOperator-4B-i1-IQ2_XXS.gguf b/LocoOperator-4B-i1-IQ2_XXS.gguf new file mode 100644 index 0000000..8027741 --- /dev/null +++ b/LocoOperator-4B-i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af6921ab2e845475f877a22fba256cb42c6312f9ee51b328e5055c8b7a73325 +size 1246619776 diff --git a/LocoOperator-4B-i1-IQ3_M.gguf b/LocoOperator-4B-i1-IQ3_M.gguf new file mode 100644 index 0000000..3d3a5ef --- /dev/null +++ b/LocoOperator-4B-i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5da9d59fd7b547dd24af0749a5f4698c97844245182c035a5e6abf1bfbb9af3 +size 1962894976 diff --git a/LocoOperator-4B-i1-IQ3_S.gguf b/LocoOperator-4B-i1-IQ3_S.gguf new file mode 100644 index 0000000..ad734fe --- /dev/null +++ b/LocoOperator-4B-i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37f0eaccf94fe3765ce9b2649c0a5a2596470b8f13d2970eacc752c7ef86643 +size 1899529856 diff --git a/LocoOperator-4B-i1-IQ3_XS.gguf b/LocoOperator-4B-i1-IQ3_XS.gguf new file mode 100644 index 0000000..f011956 --- /dev/null +++ b/LocoOperator-4B-i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e231e115d69b439be749fee74c5c1835ac4911b40a8c627d2e4a67de664e65ae +size 1814374016 diff --git a/LocoOperator-4B-i1-IQ3_XXS.gguf b/LocoOperator-4B-i1-IQ3_XXS.gguf new file mode 100644 index 0000000..413dc7a --- /dev/null +++ b/LocoOperator-4B-i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4c2eb5c80727d61728c6045fa986d6cfe98a85ddadf1dbc944aec07b99cc26b +size 1670187136 diff --git a/LocoOperator-4B-i1-IQ4_NL.gguf b/LocoOperator-4B-i1-IQ4_NL.gguf new file mode 100644 index 0000000..453db01 --- /dev/null +++ b/LocoOperator-4B-i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c11e0d53bea7d34de5f063793ceddc80b8a5c5392540ee09d038565b4261e74 +size 2381342336 diff --git a/LocoOperator-4B-i1-IQ4_XS.gguf b/LocoOperator-4B-i1-IQ4_XS.gguf new file mode 100644 index 0000000..3743f33 --- /dev/null +++ b/LocoOperator-4B-i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c250eb26b67cf2f5235e5b2151dd46d89712d6bbb05f5a1b4f0db33231609cef +size 2270750336 diff --git a/LocoOperator-4B-i1-MXFP4_MOE.gguf b/LocoOperator-4B-i1-MXFP4_MOE.gguf new file mode 100644 index 0000000..fb82a2b --- /dev/null +++ b/LocoOperator-4B-i1-MXFP4_MOE.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25dbef25e18b7c0aae4f6a286056f1a5ef68162e69d5c4c895111ce9867d5d69 +size 4280404096 diff --git a/LocoOperator-4B-i1-Q2_K.gguf b/LocoOperator-4B-i1-Q2_K.gguf new file mode 100644 index 0000000..0a913f7 --- /dev/null +++ b/LocoOperator-4B-i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d809fa284457894e09fa7da0fb15e991186e06d80093a2a7e1bbf10b3847649 +size 1669498496 diff --git a/LocoOperator-4B-i1-Q2_K_S.gguf b/LocoOperator-4B-i1-Q2_K_S.gguf new file mode 100644 index 0000000..1e87575 --- /dev/null +++ b/LocoOperator-4B-i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7c73624e270fee13a18d5da85fe068fe05cd7804c86cf4acb146624e35abafd +size 1563453056 diff --git a/LocoOperator-4B-i1-Q3_K_L.gguf b/LocoOperator-4B-i1-Q3_K_L.gguf new file mode 100644 index 0000000..7463545 --- /dev/null +++ b/LocoOperator-4B-i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b97276ea098c01530d1f0efc83aafa159b1231f9f6ab02f41b393e3eaaf780d +size 2239784576 diff --git a/LocoOperator-4B-i1-Q3_K_M.gguf b/LocoOperator-4B-i1-Q3_K_M.gguf new file mode 100644 index 0000000..a2a09ff --- /dev/null +++ b/LocoOperator-4B-i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb4724130754050c808e2ca8c057a5a7001083fab9722063a5151a7a4dca380 +size 2075616896 diff --git a/LocoOperator-4B-i1-Q3_K_S.gguf b/LocoOperator-4B-i1-Q3_K_S.gguf new file mode 100644 index 0000000..ed153dc --- /dev/null +++ b/LocoOperator-4B-i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:173473681806845f2fe75598623fd9c049ef448ec0bf0ee0483d5a9bda04627e +size 1886996096 diff --git a/LocoOperator-4B-i1-Q4_0.gguf b/LocoOperator-4B-i1-Q4_0.gguf new file mode 100644 index 0000000..426536b --- /dev/null +++ b/LocoOperator-4B-i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d5eac9356e505071f3c1583b64a727e98e79a40e33546785cbb0d4e34fdd23 +size 2375771776 diff --git a/LocoOperator-4B-i1-Q4_1.gguf b/LocoOperator-4B-i1-Q4_1.gguf new file mode 100644 index 0000000..f39cf16 --- /dev/null +++ b/LocoOperator-4B-i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2abae241ca83ca2a400f19d4bb3ed251a301513c4fc571b0e2dd29af644745d7 +size 2596628096 diff --git a/LocoOperator-4B-i1-Q4_K_M.gguf b/LocoOperator-4B-i1-Q4_K_M.gguf new file mode 100644 index 0000000..2a2b7fe --- /dev/null +++ b/LocoOperator-4B-i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4acfade3fc6c6a3e5785b7aa4d9ab8feccffeae54c97178d3f41d95709c10705 +size 2497279616 diff --git a/LocoOperator-4B-i1-Q4_K_S.gguf b/LocoOperator-4B-i1-Q4_K_S.gguf new file mode 100644 index 0000000..1b67b29 --- /dev/null +++ b/LocoOperator-4B-i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b99d24c3821ed7328487bcccedc7cd64b762ad152d35151958d706ac43408a +size 2383308416 diff --git a/LocoOperator-4B-i1-Q5_0.gguf b/LocoOperator-4B-i1-Q5_0.gguf new file mode 100644 index 0000000..be971d1 --- /dev/null +++ b/LocoOperator-4B-i1-Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80fb388626f1745294c1f2eed91daadbf01e6f6dfca6be9c46851e02c164b85 +size 2829936256 diff --git a/LocoOperator-4B-i1-Q5_1.gguf b/LocoOperator-4B-i1-Q5_1.gguf new file mode 100644 index 0000000..6586791 --- /dev/null +++ b/LocoOperator-4B-i1-Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266927d5893afe2243bfb7fa0a4cb505a11cda2b365bc1f937d6b849238031cf +size 3050792576 diff --git a/LocoOperator-4B-i1-Q5_K_M.gguf b/LocoOperator-4B-i1-Q5_K_M.gguf new file mode 100644 index 0000000..e860797 --- /dev/null +++ b/LocoOperator-4B-i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1b7ac05dbfb905f1175f6569f26fda6c0cde0c0620b5181af6fc8766ddd23f +size 2889512576 diff --git a/LocoOperator-4B-i1-Q5_K_S.gguf b/LocoOperator-4B-i1-Q5_K_S.gguf new file mode 100644 index 0000000..a6c96b5 --- /dev/null +++ b/LocoOperator-4B-i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:546b4c50c27002e9e4353f4e4983844c5563d1bc626a7e1b671fc0de70913cbe +size 2823710336 diff --git a/LocoOperator-4B-i1-Q6_K.gguf b/LocoOperator-4B-i1-Q6_K.gguf new file mode 100644 index 0000000..8499115 --- /dev/null +++ b/LocoOperator-4B-i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0967cda05cf46393b6019ab788dad343ef7f0eba935373f15deac90b004682c +size 3306260096 diff --git a/LocoOperator-4B-i1-Q8_0.gguf b/LocoOperator-4B-i1-Q8_0.gguf new file mode 100644 index 0000000..8af418a --- /dev/null +++ b/LocoOperator-4B-i1-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08568c3e3f73f32aa966dae5dd7505501f9d4b3572e768de4965473f19e71036 +size 4280404096 diff --git a/LocoOperator-4B.imatrix.gguf b/LocoOperator-4B.imatrix.gguf new file mode 100644 index 0000000..a9f7ba8 --- /dev/null +++ b/LocoOperator-4B.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2949eed0c52e584edd8b055c111b654a461a841f031e795eb7477bdbdc0e49 +size 3872640 diff --git a/README.md b/README.md new file mode 100644 index 0000000..83d96a7 --- /dev/null +++ b/README.md @@ -0,0 +1,229 @@ +--- +library_name: transformers +license: mit +base_model: +- LocoreMind/LocoOperator-4B +tags: +- code +- agent +- tool-calling +- distillation +- qwen3 +- gguf +- llama-cpp +language: +- en +pipeline_tag: text-generation +--- +# This is a Imatrix quantization of [LocoreMind/LocoOperator-4B](https://huggingface.co/LocoreMind/LocoOperator-4B), made by [SimplySara](https://huggingface.co/SimplySara) + +| Model | Size_GB | BPW | PPL_Q | KLD_Mean | KLD_Max | Top_P_Match | +|:----------------------------------|----------:|------:|----------:|-----------:|----------:|:--------------| +| LocoOperator-4B-BF16.gguf | 7.498 | 16.01 | 9.24309 | -1.2e-05 | 4e-06 | 100.000% | +| LocoOperator-4B-MXFP4_MOE.gguf | 3.986 | 8.51 | 9.24606 | 0.001835 | 2.98238 | 97.518% | +| LocoOperator-4B-i1-MXFP4_MOE.gguf | 3.986 | 8.51 | 9.24606 | 0.001835 | 2.98238 | 97.518% | +| LocoOperator-4B-Q8_0.gguf | 3.986 | 8.51 | 9.24606 | 0.001835 | 2.98238 | 97.518% | +| LocoOperator-4B-i1-Q8_0.gguf | 3.986 | 8.51 | 9.24606 | 0.001835 | 2.98238 | 97.518% | +| LocoOperator-4B-Q6_K.gguf | 3.079 | 6.58 | 9.27926 | 0.0068 | 10.5686 | 95.526% | +| LocoOperator-4B-i1-Q6_K.gguf | 3.079 | 6.58 | 9.295 | 0.006075 | 15.9945 | 95.857% | +| LocoOperator-4B-i1-Q5_1.gguf | 2.841 | 6.07 | 9.28859 | 0.01364 | 2.98838 | 94.135% | +| LocoOperator-4B-Q5_1.gguf | 2.841 | 6.07 | 9.43222 | 0.022675 | 16.3454 | 93.161% | +| LocoOperator-4B-Q5_K_M.gguf | 2.691 | 5.75 | 9.35457 | 0.017023 | 12.3947 | 93.635% | +| LocoOperator-4B-i1-Q5_K_M.gguf | 2.691 | 5.75 | 9.2965 | 0.013153 | 7.78613 | 94.257% | +| LocoOperator-4B-i1-Q5_0.gguf | 2.636 | 5.63 | 9.42255 | 0.019663 | 17.94 | 93.208% | +| LocoOperator-4B-Q5_0.gguf | 2.63 | 5.62 | 9.41521 | 0.023403 | 31.4019 | 92.839% | +| LocoOperator-4B-Q5_K_S.gguf | 2.63 | 5.62 | 9.44087 | 0.022119 | 13.6483 | 92.800% | +| LocoOperator-4B-i1-Q5_K_S.gguf | 2.63 | 5.62 | 9.28767 | 0.014865 | 7.65169 | 93.702% | +| LocoOperator-4B-Q4_1.gguf | 2.418 | 5.16 | 9.66722 | 0.074718 | 15.0861 | 87.757% | +| LocoOperator-4B-i1-Q4_1.gguf | 2.418 | 5.16 | 9.45293 | 0.038707 | 13.8444 | 90.574% | +| LocoOperator-4B-Q4_K_M.gguf | 2.326 | 4.97 | 9.48239 | 0.048236 | 15.3105 | 90.300% | +| LocoOperator-4B-i1-Q4_K_M.gguf | 2.326 | 4.97 | 9.48582 | 0.03368 | 13.551 | 91.233% | +| LocoOperator-4B-IQ4_NL.gguf | 2.229 | 4.76 | 9.60891 | 0.050173 | 11.4324 | 89.708% | +| LocoOperator-4B-i1-Q4_K_S.gguf | 2.22 | 4.74 | 9.47603 | 0.039843 | 10.0551 | 90.557% | +| LocoOperator-4B-Q4_K_S.gguf | 2.22 | 4.74 | 9.80236 | 0.068821 | 15.209 | 88.513% | +| LocoOperator-4B-i1-IQ4_NL.gguf | 2.218 | 4.74 | 9.50223 | 0.039414 | 8.18964 | 90.573% | +| LocoOperator-4B-i1-Q4_0.gguf | 2.213 | 4.73 | 9.79026 | 0.063915 | 12.6928 | 88.737% | +| LocoOperator-4B-Q4_0.gguf | 2.207 | 4.71 | 9.86629 | 0.074527 | 13.2501 | 87.758% | +| LocoOperator-4B-IQ4_XS.gguf | 2.129 | 4.55 | 9.62193 | 0.051911 | 11.0682 | 89.705% | +| LocoOperator-4B-i1-IQ4_XS.gguf | 2.115 | 4.52 | 9.49687 | 0.040098 | 7.03875 | 90.402% | +| LocoOperator-4B-Q3_K_L.gguf | 2.086 | 4.45 | 10.2476 | 0.121944 | 27.0257 | 84.146% | +| LocoOperator-4B-i1-Q3_K_L.gguf | 2.086 | 4.45 | 9.90811 | 0.090874 | 15.8122 | 86.154% | +| LocoOperator-4B-Q3_K_M.gguf | 1.933 | 4.13 | 10.7021 | 0.15788 | 20.2044 | 82.662% | +| LocoOperator-4B-i1-Q3_K_M.gguf | 1.933 | 4.13 | 9.98057 | 0.102708 | 16.8243 | 85.354% | +| LocoOperator-4B-i1-IQ3_M.gguf | 1.828 | 3.9 | 10.1634 | 0.137347 | 14.6883 | 83.180% | +| LocoOperator-4B-IQ3_M.gguf | 1.828 | 3.9 | 14.2539 | 0.557713 | 19.4397 | 67.631% | +| LocoOperator-4B-IQ3_S.gguf | 1.769 | 3.78 | 15.0624 | 0.619131 | 20.122 | 65.931% | +| LocoOperator-4B-i1-IQ3_S.gguf | 1.769 | 3.78 | 10.1755 | 0.142066 | 17.0028 | 83.139% | +| LocoOperator-4B-i1-Q3_K_S.gguf | 1.757 | 3.75 | 10.8886 | 0.171224 | 28.3373 | 82.133% | +| LocoOperator-4B-Q3_K_S.gguf | 1.757 | 3.75 | 11.5475 | 0.237895 | 30.6868 | 79.412% | +| LocoOperator-4B-i1-IQ3_XS.gguf | 1.69 | 3.61 | 10.3629 | 0.168783 | 14.3358 | 81.928% | +| LocoOperator-4B-i1-Q2_K.gguf | 1.555 | 3.32 | 12.1574 | 0.328652 | 18.6622 | 75.570% | +| LocoOperator-4B-i1-IQ3_XXS.gguf | 1.555 | 3.32 | 11.2795 | 0.263448 | 25.251 | 77.569% | +| LocoOperator-4B-Q2_K.gguf | 1.555 | 3.32 | 17.153 | 0.713596 | 16.3946 | 64.880% | +| LocoOperator-4B-i1-Q2_K_S.gguf | 1.456 | 3.11 | 13.1709 | 0.450125 | 18.3826 | 71.231% | +| LocoOperator-4B-i1-IQ2_M.gguf | 1.409 | 3.01 | 14.0857 | 0.544764 | 18.5618 | 67.933% | +| LocoOperator-4B-i1-IQ2_S.gguf | 1.32 | 2.82 | 15.0717 | 0.621189 | 24.0981 | 65.722% | +| LocoOperator-4B-i1-IQ2_XS.gguf | 1.261 | 2.69 | 16.8277 | 0.750336 | 19.2128 | 63.162% | +| LocoOperator-4B-i1-IQ2_XXS.gguf | 1.161 | 2.48 | 27.5988 | 1.32144 | 14.6807 | 52.522% | +| LocoOperator-4B-i1-IQ1_M.gguf | 1.05 | 2.24 | 49.0978 | 1.9323 | 16.5947 | 44.067% | +| LocoOperator-4B-i1-IQ1_S.gguf | 0.983 | 2.1 | 139.951 | 3.03274 | 16.0947 | 28.387% | + + +------ + +
+ LocoOperator +
+ +
+ +
+ +[![MODEL](https://img.shields.io/badge/Model-FFB300?style=for-the-badge&logo=huggingface&logoColor=white)](https://huggingface.co/LocoreMind/LocoOperator-4B) +[![GGUF](https://img.shields.io/badge/GGUF-FF6F00?style=for-the-badge&logo=huggingface&logoColor=white)](https://huggingface.co/LocoreMind/LocoOperator-4B-GGUF) +[![Blog](https://img.shields.io/badge/Blog-4285F4?style=for-the-badge&logo=google-chrome&logoColor=white)](https://locoremind.com/blog/loco-operator) +[![GitHub](https://img.shields.io/badge/GitHub-181717?style=for-the-badge&logo=github&logoColor=white)](https://github.com/LocoreMind/LocoOperator) +[![Colab](https://img.shields.io/badge/Colab-F9AB00?style=for-the-badge&logo=googlecolab&logoColor=white)](https://colab.research.google.com/github/LocoreMind/LocoOperator/blob/main/LocoOperator_4B.ipynb) + +
+ +## Introduction + +**LocoOperator-4B** is a 4B-parameter tool-calling agent model trained via knowledge distillation from **Qwen3-Coder-Next** inference traces. It specializes in multi-turn codebase exploration — reading files, searching code, and navigating project structures within a Claude Code-style agent loop. Designed as a local sub agent, it runs via llama.cpp at zero API cost. + +| | LocoOperator-4B | +|:--|:--| +| **Base Model** | [Qwen3-4B-Instruct-2507](https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507) | +| **Teacher Model** | Qwen3-Coder-Next | +| **Training Method** | Full-parameter SFT (distillation) | +| **Training Data** | 170,356 multi-turn conversation samples | +| **Max Sequence Length** | 16,384 tokens | +| **Training Hardware** | 4x NVIDIA H200 141GB SXM5 | +| **Training Time** | ~25 hours | +| **Framework** | MS-SWIFT | + +## Key Features + +- **Tool-Calling Agent**: Generates structured `` JSON for Read, Grep, Glob, Bash, Write, Edit, and Task (subagent delegation) +- **100% JSON Validity**: Every tool call is valid JSON with all required arguments — outperforming the teacher model (87.6%) +- **Local Deployment**: GGUF quantized, runs on Mac Studio via llama.cpp at zero API cost +- **Lightweight Explorer**: 4B parameters, optimized for fast codebase search and navigation +- **Multi-Turn**: Handles conversation depths of 3–33 messages with consistent tool-calling behavior + +## Performance + +Evaluated on 65 multi-turn conversation samples from diverse open-source projects (scipy, fastapi, arrow, attrs, gevent, gunicorn, etc.), with labels generated by Qwen3-Coder-Next. + +### Core Metrics + +| Metric | Score | +|:-------|:-----:| +| **Tool Call Presence Alignment** | **100%** (65/65) | +| **First Tool Type Match** | **65.6%** (40/61) | +| **JSON Validity** | **100%** (76/76) | +| **Argument Syntax Correctness** | **100%** (76/76) | + +The model perfectly learned *when* to use tools vs. when to respond with text (100% presence alignment). Tool type mismatches are between semantically similar tools (e.g. Grep vs Read) — different but often valid strategies. + +### Tool Distribution Comparison + +
+ Tool Distribution Comparison +
+ +### JSON & Argument Syntax Correctness + +| Model | JSON Valid | Argument Syntax Valid | +|:------|:---------:|:--------------------:| +| **LocoOperator-4B** | 76/76 (100%) | 76/76 (100%) | +| Qwen3-Coder-Next (teacher) | 89/89 (100%) | 78/89 (87.6%) | + +> LocoOperator-4B achieves perfect structured output. The teacher model has 11 tool calls with missing required arguments (empty `arguments: {}`). + +## Quick Start + +```python +from transformers import AutoModelForCausalLM, AutoTokenizer + +model_name = "LocoreMind/LocoOperator-4B" + +# load the tokenizer and the model +tokenizer = AutoTokenizer.from_pretrained(model_name) +model = AutoModelForCausalLM.from_pretrained( + model_name, + torch_dtype="auto", + device_map="auto" +) + +# prepare the messages +messages = [ + { + "role": "system", + "content": "You are a read-only codebase search specialist.\n\nCRITICAL CONSTRAINTS:\n1. STRICTLY READ-ONLY: You cannot create, edit, delete, move files, or run any state-changing commands. Use tools/bash ONLY for reading (e.g., ls, find, cat, grep).\n2. EFFICIENCY: Spawn multiple parallel tool calls for faster searching.\n3. OUTPUT RULES: \n - ALWAYS use absolute file paths.\n - STRICTLY NO EMOJIS in your response.\n - Output your final report directly. Do not use colons before tool calls.\n\nENV: Working directory is /Users/developer/workspace/code-analyzer (macOS, zsh)." + }, + { + "role": "user", + "content": "Analyze the Black codebase at `/Users/developer/workspace/code-analyzer/projects/black`.\nFind and explain:\n1. How Black discovers config files.\n2. The exact search order for config files.\n3. Supported config file formats.\n4. Where this configuration discovery logic lives in the codebase.\n\nReturn a comprehensive answer with relevant code snippets and absolute file paths." + } +] + +# prepare the model input +text = tokenizer.apply_chat_template( + messages, + tokenize=False, + add_generation_prompt=True, +) +model_inputs = tokenizer([text], return_tensors="pt").to(model.device) + +# conduct text completion +generated_ids = model.generate( + **model_inputs, + max_new_tokens=512, +) +output_ids = generated_ids[0][len(model_inputs.input_ids[0]):].tolist() + +content = tokenizer.decode(output_ids, skip_special_tokens=True) +print(content) +``` + +## Local Deployment + +For GGUF quantized deployment with llama.cpp, hybrid proxy routing, and batch analysis pipelines, refer to our [GitHub repository](https://github.com/LocoreMind/LocoOperator). + +## Training Details + +| Parameter | Value | +|:----------|:------| +| Base model | Qwen3-4B-Instruct-2507 | +| Teacher model | Qwen3-Coder-Next | +| Method | Full-parameter SFT | +| Training data | 170,356 samples | +| Hardware | 4x NVIDIA H200 141GB SXM5 | +| Parallelism | DDP (no DeepSpeed) | +| Precision | BF16 | +| Epochs | 1 | +| Batch size | 2/GPU, gradient accumulation 4 (effective batch 32) | +| Learning rate | 2e-5, warmup ratio 0.03 | +| Max sequence length | 16,384 tokens | +| Template | qwen3_nothinking | +| Framework | MS-SWIFT | +| Training time | ~25 hours | +| Checkpoint | Step 2524 | + +## Known Limitations + +- First-tool-type match is 65.6% — the model sometimes picks a different (but not necessarily wrong) tool than the teacher +- Tends to under-generate parallel tool calls compared to the teacher (76 vs 89 total calls across 65 samples) +- Preference for Bash over Read may indicate the model defaults to shell commands where file reads would be more appropriate +- Evaluated on 65 samples only; larger-scale evaluation needed + +## License + +MIT + +## Acknowledgments + +- [Qwen Team](https://huggingface.co/Qwen) for the Qwen3-4B-Instruct-2507 base model +- [MS-SWIFT](https://github.com/modelscope/ms-swift) for the training framework +- [llama.cpp](https://github.com/ggerganov/llama.cpp) for efficient local inference +- [Anthropic](https://www.anthropic.com/) for the Claude Code agent loop design that inspired this work \ No newline at end of file