初始化项目,由ModelHub XC社区提供模型
Model: calcuis/phi3 Source: Original Platform
This commit is contained in:
53
.gitattributes
vendored
Normal file
53
.gitattributes
vendored
Normal file
@@ -0,0 +1,53 @@
|
|||||||
|
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.model filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||||
|
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_tq1_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_tq2_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q2_k.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q6_k.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_f16.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_f32.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q4_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q5_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q3_k_l.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q3_k_s.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q4_k_s.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
phi3_q5_k_s.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
32
README.md
Normal file
32
README.md
Normal file
@@ -0,0 +1,32 @@
|
|||||||
|
---
|
||||||
|
license: mit
|
||||||
|
language:
|
||||||
|
- en
|
||||||
|
base_model:
|
||||||
|
- microsoft/Phi-3-mini-128k-instruct
|
||||||
|
pipeline_tag: text-generation
|
||||||
|
---
|
||||||
|
|
||||||
|
## GGUF quantized version of Phi-3 Model (128k-instruct mini)
|
||||||
|
|
||||||
|
original project [source](https://huggingface.co/microsoft/Phi-3-mini-128k-instruct) (base model)
|
||||||
|
|
||||||
|
Q_2 (not nice)
|
||||||
|
|
||||||
|
Q_3 (acceptable)
|
||||||
|
|
||||||
|
Q_4 family is recommended (good for running with CPU as well)
|
||||||
|
|
||||||
|
Q_5 (good in general)
|
||||||
|
|
||||||
|
Q_6 is also good; if you want a better result, take this one instead of Q_5
|
||||||
|
|
||||||
|
Q_8 is very good, but it needs a reasonable amount of RAM; otherwise you might expect a long wait
|
||||||
|
|
||||||
|
16-bit and 32-bit are also provided here for research purposes; since the 16-bit file size is similar to the original safetensors, if you have a GPU, go ahead with the safetensors instead; the results are pretty much the same
|
||||||
|
|
||||||
|
### how to run it
|
||||||
|
|
||||||
|
use any connector for interacting with gguf; e.g., [gguf-connector](https://pypi.org/project/gguf-connector/)
|
||||||
|
|
||||||
|
welcome to ai era
|
||||||
1
configuration.json
Normal file
1
configuration.json
Normal file
@@ -0,0 +1 @@
|
|||||||
|
{"framework": "pytorch", "task": "text-generation", "allow_remote": true}
|
||||||
3
phi3_f16.gguf
Normal file
3
phi3_f16.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:1c56ff08a9b489d94795626e3e1859345cb615bda00d3d81c2852a716bf8d737
|
||||||
|
size 7643297248
|
||||||
3
phi3_f32.gguf
Normal file
3
phi3_f32.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:08fd99046be952d0b9e8a0c5c991f3a6864f52b7b3ffc23f39dd988cf2428507
|
||||||
|
size 15285056992
|
||||||
3
phi3_q2_k.gguf
Normal file
3
phi3_q2_k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:7f77f943e8802e482fe866fc418c9b4663d9301ab5ea3a01ff3f711be149056d
|
||||||
|
size 1416204256
|
||||||
3
phi3_q3_k_l.gguf
Normal file
3
phi3_q3_k_l.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:5776245e5c071961dc4ab9bdaed41bc6804727f8a13dc47f45452a98c088f621
|
||||||
|
size 2087597536
|
||||||
3
phi3_q3_k_m.gguf
Normal file
3
phi3_q3_k_m.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:1836d3292d005cdc07184e8f94690460cc9c6cf3b7eff3486caba62cd6fc4af1
|
||||||
|
size 1955476960
|
||||||
3
phi3_q3_k_s.gguf
Normal file
3
phi3_q3_k_s.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:701fc0908faafc84b3d86be86b983cccd25be84e2bc15acf1ba5baf989e5dbf0
|
||||||
|
size 1681798624
|
||||||
3
phi3_q4_0.gguf
Normal file
3
phi3_q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:48ad47a65b166d1f8b077c06d4e7612bd58ec914fa0d476f1b68f0eb4a70b9c5
|
||||||
|
size 2176177120
|
||||||
3
phi3_q4_1.gguf
Normal file
3
phi3_q4_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:dda1cbcc031069c80626ede68a8c273ce64f69a6a95ad6dfacd558c7d345e337
|
||||||
|
size 2408825824
|
||||||
3
phi3_q4_k_m.gguf
Normal file
3
phi3_q4_k_m.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:48ad47a65b166d1f8b077c06d4e7612bd58ec914fa0d476f1b68f0eb4a70b9c5
|
||||||
|
size 2176177120
|
||||||
3
phi3_q4_k_s.gguf
Normal file
3
phi3_q4_k_s.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:d736d46af9edaeafad2b8939639a8835ae72e4dda3c18701e363eb142581e375
|
||||||
|
size 2188760032
|
||||||
3
phi3_q5_0.gguf
Normal file
3
phi3_q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:55a604f08194daa76e90f7f8f75bb0712a72ba2906a32231d7f882d96b417fa7
|
||||||
|
size 2641474528
|
||||||
3
phi3_q5_1.gguf
Normal file
3
phi3_q5_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:743b208fa089b1a9e27a25a8d822522944b7ddbac08a991729789f1695f6787f
|
||||||
|
size 2874123232
|
||||||
3
phi3_q5_k_m.gguf
Normal file
3
phi3_q5_k_m.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:9f3970619392752c402bbb1b53d3d09326c1f02b1b83ae6374d672307db330f5
|
||||||
|
size 2815276000
|
||||||
3
phi3_q5_k_s.gguf
Normal file
3
phi3_q5_k_s.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:dc2698ef8ec718dd507884522e10d44ab8d7773c9b781d241cdc5271c5568959
|
||||||
|
size 2641474528
|
||||||
3
phi3_q6_k.gguf
Normal file
3
phi3_q6_k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:7da61563618da640141f88d10c04ea2408455324202bbf893fe91b0364d6ed93
|
||||||
|
size 3135853024
|
||||||
3
phi3_q8_0.gguf
Normal file
3
phi3_q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:ff469a8262b93af869d457cb94b4e87e64a424f9dd1663082d6084cb11418f3a
|
||||||
|
size 4061222368
|
||||||
3
phi3_tq1_0.gguf
Normal file
3
phi3_tq1_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:ff409fb51328897f5298d13fa220c55aed1c93fac8e86c664ad2999bb5effb2d
|
||||||
|
size 1159951840
|
||||||
3
phi3_tq2_0.gguf
Normal file
3
phi3_tq2_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:12da0d47aabf31f62295aee59cd7a55723e179aef59443316aaaff2bebbaeead
|
||||||
|
size 1329821152
|
||||||
Reference in New Issue
Block a user