初始化项目,由ModelHub XC社区提供模型
Model: prithivMLmods/MemOperator-4B-f32-GGUF Source: Original Platform
This commit is contained in:
3
MemOperator-4B.BF16.gguf
Normal file
3
MemOperator-4B.BF16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:376d0c3e256fcd791295ee9d4d64f4d435f919dcf59ba4c50a528c52f021b6a9
|
||||
size 8051284704
|
||||
3
MemOperator-4B.F16.gguf
Normal file
3
MemOperator-4B.F16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:0c3b44ec90a4143d7d766cd3286ab8093469f81bbec6d5443250abae65aa59f8
|
||||
size 8051284704
|
||||
3
MemOperator-4B.F32.gguf
Normal file
3
MemOperator-4B.F32.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a7e570ec23f244fbe4f552cafc0d9121cbe31b88d2a2dfe246651e2a21a32aa4
|
||||
size 16095828704
|
||||
3
MemOperator-4B.Q2_K.gguf
Normal file
3
MemOperator-4B.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:6bd1e18ca1b1700fd7490564078a2f6409e4411030860216c42c4de8c45f0705
|
||||
size 1669499104
|
||||
3
MemOperator-4B.Q3_K_L.gguf
Normal file
3
MemOperator-4B.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:4d487cdca79da4f4693ddddecc84e91a7e11354e7e6c39841a981678036f1ac4
|
||||
size 2239785184
|
||||
3
MemOperator-4B.Q3_K_M.gguf
Normal file
3
MemOperator-4B.Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:89ae74d20d39df28afed238d97567b5bb6d86d19f91bd4ade685c07d10a26bf6
|
||||
size 2075617504
|
||||
3
MemOperator-4B.Q3_K_S.gguf
Normal file
3
MemOperator-4B.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:0b7ffc9ff3472a1fee0bbe84e83a56e9bde426c989f671a7dbae3a2a25c3d9cb
|
||||
size 1886996704
|
||||
3
MemOperator-4B.Q4_K_M.gguf
Normal file
3
MemOperator-4B.Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:11d6e9e80e08853d19b2392452cfda637b6a3baf6c83a5957ae4b43da50e7c9b
|
||||
size 2497280224
|
||||
3
MemOperator-4B.Q4_K_S.gguf
Normal file
3
MemOperator-4B.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8cb55a1dfc23eb4395dd6e4c996d0065fd8c2eac350b620c2bdf5a02a715e241
|
||||
size 2383309024
|
||||
3
MemOperator-4B.Q5_K_M.gguf
Normal file
3
MemOperator-4B.Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:081f03410ec3b49b754c9a60d1dc672fb989149d321db1a445aac80063ea059b
|
||||
size 2889513184
|
||||
3
MemOperator-4B.Q5_K_S.gguf
Normal file
3
MemOperator-4B.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:f137bff768e41f632c11c61220f99e1151b14c1bdfa051baa008c3f9e646a228
|
||||
size 2823710944
|
||||
3
MemOperator-4B.Q6_K.gguf
Normal file
3
MemOperator-4B.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:eabd11d88e420acea49be892581d01978957b326a60b78cc8da21e035f28295f
|
||||
size 3306260704
|
||||
3
MemOperator-4B.Q8_0.gguf
Normal file
3
MemOperator-4B.Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:18ead8ef725bd114a8ae4e84436bc8a36297855f9ca9976287ab961155f02b82
|
||||
size 4280404704
|
||||
47
.gitattributes
vendored
Normal file
47
.gitattributes
vendored
Normal file
@@ -0,0 +1,47 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
||||
*.tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
*.db* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ark* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.gguf* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ggml filter=lfs diff=lfs merge=lfs -text
|
||||
*.llamafile* filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
44
README.md
Normal file
44
README.md
Normal file
@@ -0,0 +1,44 @@
|
||||
---
|
||||
license: apache-2.0
|
||||
base_model:
|
||||
- MemTensor/MemOperator-4B
|
||||
language:
|
||||
- en
|
||||
pipeline_tag: text-generation
|
||||
library_name: transformers
|
||||
tags:
|
||||
- text-generation-inference
|
||||
---
|
||||
|
||||
# **MemOperator-4B-f32-GGUF**
|
||||
|
||||
> MemOperator-4B by MemTensor is a specialized causal language model designed for efficient memory operations within the MemOS system. It excels in memory extraction, integration, and updating while enabling local-only deployment for environments without internet access. Derived from the Qwen3-4B architecture and fine-tuned via supervised learning on both human-annotated and generated data, this 4 billion parameter model supports both English and Chinese, and processes long contexts up to 32,768 tokens.
|
||||
|
||||
> It offers fast, low-resource memory management that outperforms comparably sized open models and is competitive with proprietary models such as GPT-4o-mini, making it ideal for real-time, cost-effective memory tasks in conversational and document settings. MemOperator-4B is designed to seamlessly extract high-quality memories and organize them for enhanced long-term coherence in applications such as MemOS, supporting memory-centric AI workflows with strong multilingual capabilities and robust system performance.
|
||||
|
||||
## Model Files
|
||||
|
||||
| Model File name | Size | QuantType |
|
||||
|---|---|---|
|
||||
| MemOperator-4B.BF16.gguf | 8.05 GB | BF16 |
|
||||
| MemOperator-4B.F16.gguf | 8.05 GB | F16 |
|
||||
| MemOperator-4B.F32.gguf | 16.1 GB | F32 |
|
||||
| MemOperator-4B.Q2_K.gguf | 1.67 GB | Q2_K |
|
||||
| MemOperator-4B.Q3_K_L.gguf | 2.24 GB | Q3_K_L |
|
||||
| MemOperator-4B.Q3_K_M.gguf | 2.08 GB | Q3_K_M |
|
||||
| MemOperator-4B.Q3_K_S.gguf | 1.89 GB | Q3_K_S |
|
||||
| MemOperator-4B.Q4_K_M.gguf | 2.5 GB | Q4_K_M |
|
||||
| MemOperator-4B.Q4_K_S.gguf | 2.38 GB | Q4_K_S |
|
||||
| MemOperator-4B.Q5_K_M.gguf | 2.89 GB | Q5_K_M |
|
||||
| MemOperator-4B.Q5_K_S.gguf | 2.82 GB | Q5_K_S |
|
||||
| MemOperator-4B.Q6_K.gguf | 3.31 GB | Q6_K |
|
||||
| MemOperator-4B.Q8_0.gguf | 4.28 GB | Q8_0 |
|
||||
|
||||
## Quants Usage
|
||||
|
||||
(The files above are listed by name, not by size or quality. Where available, IQ-quants are often preferable to similar-sized non-IQ quants.)
|
||||
|
||||
Here is a handy graph by ikawrakow comparing some lower-quality quant
|
||||
types (lower is better):
|
||||
|
||||

|
||||
3
config.json
Normal file
3
config.json
Normal file
@@ -0,0 +1,3 @@
|
||||
{
|
||||
"model_type": "qwen3"
|
||||
}
|
||||
1
configuration.json
Normal file
1
configuration.json
Normal file
@@ -0,0 +1 @@
|
||||
{"framework": "pytorch", "task": "text-generation", "allow_remote": true}
|
||||
Reference in New Issue
Block a user