初始化项目,由ModelHub XC社区提供模型
Model: magiccodingman/Qwen3-4B-Instruct-2507-Unsloth-MagicQuant-v2-GGUF Source: Original Platform
This commit is contained in:
68
magicquant.hybrid-map.json
Normal file
68
magicquant.hybrid-map.json
Normal file
@@ -0,0 +1,68 @@
|
||||
[
|
||||
{
|
||||
"ExportedFileName": "Model-MQ-Q6_K_1.gguf",
|
||||
"DisplayName": "Model-MQ-Q6_K_1",
|
||||
"ProviderSource": "MagicQuant",
|
||||
"BaselineFamily": "Q6_K",
|
||||
"OriginalReferenceBaseline": "Q8_0",
|
||||
"TensorGroups": {
|
||||
"embeddings": "Q8_0",
|
||||
"attn_q": "Q8_0",
|
||||
"attn_kv": "Q8_0",
|
||||
"attn_output": "Q8_0",
|
||||
"ffn_up_gate": "Q6_K",
|
||||
"ffn_down": "Q8_0"
|
||||
},
|
||||
"EffectiveQuantStateKey": "base=standard:q8_0|attn_kv=effective:Q8_0|attn_output=effective:Q8_0|attn_q=effective:Q8_0|embeddings=effective:Q8_0|ffn_down=effective:Q8_0|ffn_up_gate=effective:Q6_K|lm_head=base|moe_experts=base|moe_router=base",
|
||||
"HasUnknownMappings": false,
|
||||
"Warnings": [],
|
||||
"UsedImatrix": true,
|
||||
"ExpectedSizeBytes": 3846147776,
|
||||
"ActualSizeBytes": 3846147776,
|
||||
"OriginalExternalSource": null
|
||||
},
|
||||
{
|
||||
"ExportedFileName": "Model-MQ-Q5_K_1.gguf",
|
||||
"DisplayName": "Model-MQ-Q5_K_1",
|
||||
"ProviderSource": "MagicQuant",
|
||||
"BaselineFamily": "Q5_K",
|
||||
"OriginalReferenceBaseline": "Q8_0",
|
||||
"TensorGroups": {
|
||||
"embeddings": "Q8_0",
|
||||
"attn_q": "Q6_K",
|
||||
"attn_kv": "Q8_0",
|
||||
"attn_output": "Q6_K",
|
||||
"ffn_up_gate": "UD-Q5_K_XL",
|
||||
"ffn_down": "Q5_K_S"
|
||||
},
|
||||
"EffectiveQuantStateKey": "base=standard:q8_0|attn_kv=effective:Q8_0|attn_output=effective:Q6_K|attn_q=effective:Q6_K|embeddings=effective:Q8_0|ffn_down=effective:Q5_K|ffn_up_gate=effective-map:0f95b03efeed21325cd9db1482ad29f6b4e758cb7c069d8a7e3e7dd34756d17f|lm_head=base|moe_experts=base|moe_router=base",
|
||||
"HasUnknownMappings": false,
|
||||
"Warnings": [],
|
||||
"UsedImatrix": true,
|
||||
"ExpectedSizeBytes": 3090906816,
|
||||
"ActualSizeBytes": 3090906816,
|
||||
"OriginalExternalSource": null
|
||||
},
|
||||
{
|
||||
"ExportedFileName": "Model-MQ-Q4_K_M_1.gguf",
|
||||
"DisplayName": "Model-MQ-Q4_K_M_1",
|
||||
"ProviderSource": "MagicQuant",
|
||||
"BaselineFamily": "Q4_K_M",
|
||||
"OriginalReferenceBaseline": "Q8_0",
|
||||
"TensorGroups": {
|
||||
"embeddings": "Q8_0",
|
||||
"attn_q": "Q5_K",
|
||||
"attn_kv": "Q8_0",
|
||||
"attn_output": "Q6_K",
|
||||
"ffn_up_gate": "IQ4_XS",
|
||||
"ffn_down": "IQ4_XS"
|
||||
},
|
||||
"EffectiveQuantStateKey": "base=standard:q8_0|attn_kv=effective:Q8_0|attn_output=effective:Q6_K|attn_q=effective:Q5_K|embeddings=effective:Q8_0|ffn_down=effective:IQ4_XS|ffn_up_gate=effective:IQ4_XS|lm_head=base|moe_experts=base|moe_router=base",
|
||||
"HasUnknownMappings": false,
|
||||
"Warnings": [],
|
||||
"UsedImatrix": true,
|
||||
"ExpectedSizeBytes": 2618576576,
|
||||
"ActualSizeBytes": 2618576576,
|
||||
"OriginalExternalSource": null
|
||||
}
|
||||
]
|
||||
Reference in New Issue
Block a user