Model: magiccodingman/Qwen3-4B-Instruct-2507-Unsloth-MagicQuant-v2-GGUF Source: Original Platform
68 lines
2.5 KiB
JSON
68 lines
2.5 KiB
JSON
[
|
|
{
|
|
"ExportedFileName": "Model-MQ-Q6_K_1.gguf",
|
|
"DisplayName": "Model-MQ-Q6_K_1",
|
|
"ProviderSource": "MagicQuant",
|
|
"BaselineFamily": "Q6_K",
|
|
"OriginalReferenceBaseline": "Q8_0",
|
|
"TensorGroups": {
|
|
"embeddings": "Q8_0",
|
|
"attn_q": "Q8_0",
|
|
"attn_kv": "Q8_0",
|
|
"attn_output": "Q8_0",
|
|
"ffn_up_gate": "Q6_K",
|
|
"ffn_down": "Q8_0"
|
|
},
|
|
"EffectiveQuantStateKey": "base=standard:q8_0|attn_kv=effective:Q8_0|attn_output=effective:Q8_0|attn_q=effective:Q8_0|embeddings=effective:Q8_0|ffn_down=effective:Q8_0|ffn_up_gate=effective:Q6_K|lm_head=base|moe_experts=base|moe_router=base",
|
|
"HasUnknownMappings": false,
|
|
"Warnings": [],
|
|
"UsedImatrix": true,
|
|
"ExpectedSizeBytes": 3846147776,
|
|
"ActualSizeBytes": 3846147776,
|
|
"OriginalExternalSource": null
|
|
},
|
|
{
|
|
"ExportedFileName": "Model-MQ-Q5_K_1.gguf",
|
|
"DisplayName": "Model-MQ-Q5_K_1",
|
|
"ProviderSource": "MagicQuant",
|
|
"BaselineFamily": "Q5_K",
|
|
"OriginalReferenceBaseline": "Q8_0",
|
|
"TensorGroups": {
|
|
"embeddings": "Q8_0",
|
|
"attn_q": "Q6_K",
|
|
"attn_kv": "Q8_0",
|
|
"attn_output": "Q6_K",
|
|
"ffn_up_gate": "UD-Q5_K_XL",
|
|
"ffn_down": "Q5_K_S"
|
|
},
|
|
"EffectiveQuantStateKey": "base=standard:q8_0|attn_kv=effective:Q8_0|attn_output=effective:Q6_K|attn_q=effective:Q6_K|embeddings=effective:Q8_0|ffn_down=effective:Q5_K|ffn_up_gate=effective-map:0f95b03efeed21325cd9db1482ad29f6b4e758cb7c069d8a7e3e7dd34756d17f|lm_head=base|moe_experts=base|moe_router=base",
|
|
"HasUnknownMappings": false,
|
|
"Warnings": [],
|
|
"UsedImatrix": true,
|
|
"ExpectedSizeBytes": 3090906816,
|
|
"ActualSizeBytes": 3090906816,
|
|
"OriginalExternalSource": null
|
|
},
|
|
{
|
|
"ExportedFileName": "Model-MQ-Q4_K_M_1.gguf",
|
|
"DisplayName": "Model-MQ-Q4_K_M_1",
|
|
"ProviderSource": "MagicQuant",
|
|
"BaselineFamily": "Q4_K_M",
|
|
"OriginalReferenceBaseline": "Q8_0",
|
|
"TensorGroups": {
|
|
"embeddings": "Q8_0",
|
|
"attn_q": "Q5_K",
|
|
"attn_kv": "Q8_0",
|
|
"attn_output": "Q6_K",
|
|
"ffn_up_gate": "IQ4_XS",
|
|
"ffn_down": "IQ4_XS"
|
|
},
|
|
"EffectiveQuantStateKey": "base=standard:q8_0|attn_kv=effective:Q8_0|attn_output=effective:Q6_K|attn_q=effective:Q5_K|embeddings=effective:Q8_0|ffn_down=effective:IQ4_XS|ffn_up_gate=effective:IQ4_XS|lm_head=base|moe_experts=base|moe_router=base",
|
|
"HasUnknownMappings": false,
|
|
"Warnings": [],
|
|
"UsedImatrix": true,
|
|
"ExpectedSizeBytes": 2618576576,
|
|
"ActualSizeBytes": 2618576576,
|
|
"OriginalExternalSource": null
|
|
}
|
|
] |