初始化项目,由ModelHub XC社区提供模型
Model: prithivMLmods/II-Search-4B-GGUF Source: Original Platform
This commit is contained in:
3
II-Search-4B-GGUF.BF16.gguf
Normal file
3
II-Search-4B-GGUF.BF16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c0afd3ec99ab9d679c5072e3fe4761f27d979ef2c2b76067bb4a906bb81c4070
|
||||
size 8051284128
|
||||
3
II-Search-4B-GGUF.F16.gguf
Normal file
3
II-Search-4B-GGUF.F16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c64e2548df5eb00421c021151406a3a86b81519f1682400eac0731ac7408156c
|
||||
size 8051284128
|
||||
3
II-Search-4B-GGUF.F32.gguf
Normal file
3
II-Search-4B-GGUF.F32.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5e85d14f21a262cf63587fc1afd9d116421146cf277a4efe9617ef267314f031
|
||||
size 16095828128
|
||||
3
II-Search-4B-GGUF.Q2_K.gguf
Normal file
3
II-Search-4B-GGUF.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1adb27ac90f90168ca582219e846f8a7a69735ffda8d55542eb565fcb78d6c24
|
||||
size 1669498528
|
||||
3
II-Search-4B-GGUF.Q3_K_L.gguf
Normal file
3
II-Search-4B-GGUF.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:490c65e827dc607711679b1cdc8712d9f25379adab0c564b977eaebf914418e9
|
||||
size 2239784608
|
||||
3
II-Search-4B-GGUF.Q3_K_M.gguf
Normal file
3
II-Search-4B-GGUF.Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:b64b5d7bca3a84bafd5e92da271736eb6a19924a74a376b668aa99ec8d347771
|
||||
size 2075616928
|
||||
3
II-Search-4B-GGUF.Q3_K_S.gguf
Normal file
3
II-Search-4B-GGUF.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:bca25ab3cd36e990e75d8eee06e78af1149fdfe8c1c73393b4098b9ff77039ca
|
||||
size 1886996128
|
||||
3
II-Search-4B-GGUF.Q4_K_M.gguf
Normal file
3
II-Search-4B-GGUF.Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:58e75048dce14e6d367bc832b224947b47c8b360dcb5672ea2d558b6daf2e6d4
|
||||
size 2497279648
|
||||
3
II-Search-4B-GGUF.Q4_K_S.gguf
Normal file
3
II-Search-4B-GGUF.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:99eec28e15d33fed0b5b1be1e9f57a326fba968c6fbb66d6d12ed5842cf88bc0
|
||||
size 2383308448
|
||||
3
II-Search-4B-GGUF.Q5_K_M.gguf
Normal file
3
II-Search-4B-GGUF.Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e9f9bf335b639d7647839294adadd5b6c3bf6429820a3d14ecfe39d814f32592
|
||||
size 2889512608
|
||||
3
II-Search-4B-GGUF.Q5_K_S.gguf
Normal file
3
II-Search-4B-GGUF.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:da208386aaadeaba08e1aedbe3cef1c7325201140cd97fdf87109ea889c62e5f
|
||||
size 2823710368
|
||||
3
II-Search-4B-GGUF.Q6_K.gguf
Normal file
3
II-Search-4B-GGUF.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:36688004299fa63c8abcb3607a2dbd008c03192865ee0a54815076a56804c519
|
||||
size 3306260128
|
||||
3
II-Search-4B-GGUF.Q8_0.gguf
Normal file
3
II-Search-4B-GGUF.Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:bf8333e13b348832cac8df7f6e15b722f91fe777496bb09d2f0152742f6cc849
|
||||
size 4280404128
|
||||
47
.gitattributes
vendored
Normal file
47
.gitattributes
vendored
Normal file
@@ -0,0 +1,47 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
||||
*.tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
*.db* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ark* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.gguf* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ggml filter=lfs diff=lfs merge=lfs -text
|
||||
*.llamafile* filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
42
README.md
Normal file
42
README.md
Normal file
@@ -0,0 +1,42 @@
|
||||
---
|
||||
license: apache-2.0
|
||||
base_model:
|
||||
- Intelligent-Internet/II-Search-4B
|
||||
language:
|
||||
- en
|
||||
pipeline_tag: text-generation
|
||||
library_name: transformers
|
||||
tags:
|
||||
- text-generation-inference
|
||||
---
|
||||
|
||||
# **II-Search-4B-GGUF**
|
||||
|
||||
> II-Search-4B is a 4-billion-parameter language model fine-tuned from Qwen3-4B specifically for advanced information-seeking and web-integrated reasoning tasks. It demonstrates strong capabilities in multi-hop information retrieval, fact verification, and comprehensive report generation, and it excels on factual QA benchmarks compared to its peers. The model features sophisticated tool use for search and web visits and supports distributed inference with vLLM or SGLang, including a 131,072-token context window with custom RoPE scaling. It is suitable for factual question answering, research assistance, and educational applications. Apple Silicon is supported via MLX, and open integration examples and full resources are available on its Hugging Face repository.
|
||||
|
||||
# Model Files
|
||||
|
||||
| File Name | Size | Quant Type |
|
||||
|-----------|------|------------|
|
||||
| II-Search-4B-GGUF.BF16.gguf | 8.05 GB | BF16 |
|
||||
| II-Search-4B-GGUF.F16.gguf | 8.05 GB | F16 |
|
||||
| II-Search-4B-GGUF.F32.gguf | 16.1 GB | F32 |
|
||||
| II-Search-4B-GGUF.Q2_K.gguf | 1.67 GB | Q2_K |
|
||||
| II-Search-4B-GGUF.Q3_K_L.gguf | 2.24 GB | Q3_K_L |
|
||||
| II-Search-4B-GGUF.Q3_K_M.gguf | 2.08 GB | Q3_K_M |
|
||||
| II-Search-4B-GGUF.Q3_K_S.gguf | 1.89 GB | Q3_K_S |
|
||||
| II-Search-4B-GGUF.Q4_K_M.gguf | 2.5 GB | Q4_K_M |
|
||||
| II-Search-4B-GGUF.Q4_K_S.gguf | 2.38 GB | Q4_K_S |
|
||||
| II-Search-4B-GGUF.Q5_K_M.gguf | 2.89 GB | Q5_K_M |
|
||||
| II-Search-4B-GGUF.Q5_K_S.gguf | 2.82 GB | Q5_K_S |
|
||||
| II-Search-4B-GGUF.Q6_K.gguf | 3.31 GB | Q6_K |
|
||||
| II-Search-4B-GGUF.Q8_0.gguf | 4.28 GB | Q8_0 |
|
||||
|
||||
## Quants Usage
|
||||
|
||||
(Sorted by size, not necessarily by quality. IQ-quants are often preferable to similar-sized non-IQ quants.)
|
||||
|
||||
Here is a handy graph by ikawrakow comparing some lower-quality quant
|
||||
types (lower is better):
|
||||
|
||||

|
||||
3
config.json
Normal file
3
config.json
Normal file
@@ -0,0 +1,3 @@
|
||||
{
|
||||
"model_type": "qwen3"
|
||||
}
|
||||
1
configuration.json
Normal file
1
configuration.json
Normal file
@@ -0,0 +1 @@
|
||||
{"framework": "pytorch", "task": "text-generation", "allow_remote": true}
|
||||
Reference in New Issue
Block a user