commit 6b1ca0ea58570a85466ca0d755b17aeae5951696 Author: ModelHub XC Date: Sat May 2 17:02:29 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: prithivMLmods/MemOperator-4B-f32-GGUF Source: Original Platform diff --git a/ MemOperator-4B.BF16.gguf b/ MemOperator-4B.BF16.gguf new file mode 100644 index 0000000..fe2c0a9 --- /dev/null +++ b/ MemOperator-4B.BF16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376d0c3e256fcd791295ee9d4d64f4d435f919dcf59ba4c50a528c52f021b6a9 +size 8051284704 diff --git a/ MemOperator-4B.F16.gguf b/ MemOperator-4B.F16.gguf new file mode 100644 index 0000000..c5662b2 --- /dev/null +++ b/ MemOperator-4B.F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3b44ec90a4143d7d766cd3286ab8093469f81bbec6d5443250abae65aa59f8 +size 8051284704 diff --git a/ MemOperator-4B.F32.gguf b/ MemOperator-4B.F32.gguf new file mode 100644 index 0000000..fd41a69 --- /dev/null +++ b/ MemOperator-4B.F32.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e570ec23f244fbe4f552cafc0d9121cbe31b88d2a2dfe246651e2a21a32aa4 +size 16095828704 diff --git a/ MemOperator-4B.Q2_K.gguf b/ MemOperator-4B.Q2_K.gguf new file mode 100644 index 0000000..08cbbee --- /dev/null +++ b/ MemOperator-4B.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd1e18ca1b1700fd7490564078a2f6409e4411030860216c42c4de8c45f0705 +size 1669499104 diff --git a/ MemOperator-4B.Q3_K_L.gguf b/ MemOperator-4B.Q3_K_L.gguf new file mode 100644 index 0000000..ee72dcb --- /dev/null +++ b/ MemOperator-4B.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d487cdca79da4f4693ddddecc84e91a7e11354e7e6c39841a981678036f1ac4 +size 2239785184 diff --git a/ MemOperator-4B.Q3_K_M.gguf b/ MemOperator-4B.Q3_K_M.gguf new file mode 100644 index 0000000..d00aea5 --- /dev/null +++ b/ MemOperator-4B.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:89ae74d20d39df28afed238d97567b5bb6d86d19f91bd4ade685c07d10a26bf6 +size 2075617504 diff --git a/ MemOperator-4B.Q3_K_S.gguf b/ MemOperator-4B.Q3_K_S.gguf new file mode 100644 index 0000000..04ca8c7 --- /dev/null +++ b/ MemOperator-4B.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7ffc9ff3472a1fee0bbe84e83a56e9bde426c989f671a7dbae3a2a25c3d9cb +size 1886996704 diff --git a/ MemOperator-4B.Q4_K_M.gguf b/ MemOperator-4B.Q4_K_M.gguf new file mode 100644 index 0000000..0ff221d --- /dev/null +++ b/ MemOperator-4B.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d6e9e80e08853d19b2392452cfda637b6a3baf6c83a5957ae4b43da50e7c9b +size 2497280224 diff --git a/ MemOperator-4B.Q4_K_S.gguf b/ MemOperator-4B.Q4_K_S.gguf new file mode 100644 index 0000000..216b269 --- /dev/null +++ b/ MemOperator-4B.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb55a1dfc23eb4395dd6e4c996d0065fd8c2eac350b620c2bdf5a02a715e241 +size 2383309024 diff --git a/ MemOperator-4B.Q5_K_M.gguf b/ MemOperator-4B.Q5_K_M.gguf new file mode 100644 index 0000000..68260db --- /dev/null +++ b/ MemOperator-4B.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:081f03410ec3b49b754c9a60d1dc672fb989149d321db1a445aac80063ea059b +size 2889513184 diff --git a/ MemOperator-4B.Q5_K_S.gguf b/ MemOperator-4B.Q5_K_S.gguf new file mode 100644 index 0000000..8fbb01a --- /dev/null +++ b/ MemOperator-4B.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f137bff768e41f632c11c61220f99e1151b14c1bdfa051baa008c3f9e646a228 +size 2823710944 diff --git a/ MemOperator-4B.Q6_K.gguf b/ MemOperator-4B.Q6_K.gguf new file mode 100644 index 0000000..4e16df2 --- /dev/null +++ b/ MemOperator-4B.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eabd11d88e420acea49be892581d01978957b326a60b78cc8da21e035f28295f +size 3306260704 diff --git a/ 
MemOperator-4B.Q8_0.gguf b/ MemOperator-4B.Q8_0.gguf new file mode 100644 index 0000000..b91427a --- /dev/null +++ b/ MemOperator-4B.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ead8ef725bd114a8ae4e84436bc8a36297855f9ca9976287ab961155f02b82 +size 4280404704 diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..53d7257 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bin.* filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs 
diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..ad40358 --- /dev/null +++ b/README.md @@ -0,0 +1,44 @@ +--- +license: apache-2.0 +base_model: +- MemTensor/MemOperator-4B +language: +- en +pipeline_tag: text-generation +library_name: transformers +tags: +- text-generation-inference +--- + +# **MemOperator-4B-f32-GGUF** + +> MemOperator-4B by MemTensor is a specialized causal language model designed for efficient memory operations within the MemOS system. It excels in memory extraction, integration, and updating while enabling local-only deployment for environments without internet access. Derived from the Qwen3-4B architecture and fine-tuned via supervised learning on both human-annotated and generated data, this 4 billion parameter model supports both English and Chinese, and processes long contexts up to 32,768 tokens. + +> It offers fast, low-resource memory management that outperforms comparably sized open models as well as GPT-4o-mini, making it ideal for real-time, cost-effective memory tasks in conversational and document settings. MemOperator-4B is designed to seamlessly extract high-quality memories and organize them for enhanced long-term coherence in applications such as MemOS, supporting memory-centric AI workflows with strong multilingual capabilities and robust system performance. 
+ +## Model Files + +| Model File name | Size | QuantType | +|---|---|---| +| MemOperator-4B.BF16.gguf | 8.05 GB | BF16 | +| MemOperator-4B.F16.gguf | 8.05 GB | F16 | +| MemOperator-4B.F32.gguf | 16.1 GB | F32 | +| MemOperator-4B.Q2_K.gguf | 1.67 GB | Q2_K | +| MemOperator-4B.Q3_K_L.gguf | 2.24 GB | Q3_K_L | +| MemOperator-4B.Q3_K_M.gguf | 2.08 GB | Q3_K_M | +| MemOperator-4B.Q3_K_S.gguf | 1.89 GB | Q3_K_S | +| MemOperator-4B.Q4_K_M.gguf | 2.5 GB | Q4_K_M | +| MemOperator-4B.Q4_K_S.gguf | 2.38 GB | Q4_K_S | +| MemOperator-4B.Q5_K_M.gguf | 2.89 GB | Q5_K_M | +| MemOperator-4B.Q5_K_S.gguf | 2.82 GB | Q5_K_S | +| MemOperator-4B.Q6_K.gguf | 3.31 GB | Q6_K | +| MemOperator-4B.Q8_0.gguf | 4.28 GB | Q8_0 | + +## Quants Usage + +(The table above is ordered by file name, not by size or quality. IQ-quants, none of which are included here, are often preferable over similarly sized non-IQ quants.) + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..5d0c447 --- /dev/null +++ b/config.json @@ -0,0 +1,3 @@ +{ + "model_type": "qwen3" +} \ No newline at end of file diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file