475 lines
16 KiB
JSON
475 lines
16 KiB
JSON
|
|
[
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "0:1:0:3:1:2:102:14:0:0",
|
||
|
|
"fileName": "Model-MQ-Q5_K.gguf",
|
||
|
|
"displayName": "Model-MQ-Q5_K",
|
||
|
|
"shortName": "MQ-Q5_K",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q8_0",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.006925,
|
||
|
|
"ppl": 8.901754,
|
||
|
|
"pplDeltaPercent": 0.204354090683967,
|
||
|
|
"sizeBytes": 3040771776,
|
||
|
|
"sizeGiB": 2.831939399242401
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "0:1:0:2:1:2:102:14:0:0",
|
||
|
|
"fileName": "Model-MQ-Q5_K_1.gguf",
|
||
|
|
"displayName": "Model-MQ-Q5_K_1",
|
||
|
|
"shortName": "MQ-Q5_K_1",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q5_K",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.006632,
|
||
|
|
"ppl": 8.900069,
|
||
|
|
"pplDeltaPercent": 0.1853865550002334,
|
||
|
|
"sizeBytes": 3090906816,
|
||
|
|
"sizeGiB": 2.878631293773651
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.00029299999999999986,
|
||
|
|
"sizeBytes": -50135040,
|
||
|
|
"sizeGiB": -0.04669189453125,
|
||
|
|
"removedPplDeltaPercent": 0.204354090683967,
|
||
|
|
"winnerPplDeltaPercent": 0.1853865550002334,
|
||
|
|
"pplDeltaPercentImprovement": 0.018967535683733605
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "2:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-Q5_K.gguf",
|
||
|
|
"displayName": "Model-LM-Q5_K",
|
||
|
|
"shortName": "LM-Q5_K",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "Q5_K",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.009942,
|
||
|
|
"ppl": 8.896878,
|
||
|
|
"pplDeltaPercent": 0.14946643252735017,
|
||
|
|
"sizeBytes": 2889514176,
|
||
|
|
"sizeGiB": 2.691069781780243
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "101:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-UD-Q5_K_XL.gguf",
|
||
|
|
"displayName": "Model-UD-Q5_K_XL",
|
||
|
|
"shortName": "UD-Q5_K_XL",
|
||
|
|
"provider": "Unsloth",
|
||
|
|
"quantFamily": "UD-Q5_K_XL",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": true,
|
||
|
|
"kld": 0.009839,
|
||
|
|
"ppl": 8.923979,
|
||
|
|
"pplDeltaPercent": 0.45453419784771626,
|
||
|
|
"sizeBytes": 2930382016,
|
||
|
|
"sizeGiB": 2.7291309237480164
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.00010299999999999893,
|
||
|
|
"sizeBytes": -40867840,
|
||
|
|
"sizeGiB": -0.03806114196777344,
|
||
|
|
"removedPplDeltaPercent": 0.14946643252735017,
|
||
|
|
"winnerPplDeltaPercent": 0.45453419784771626,
|
||
|
|
"pplDeltaPercentImprovement": -0.30506776532036606
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "13:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-Q5_K_S.gguf",
|
||
|
|
"displayName": "Model-LM-Q5_K_S",
|
||
|
|
"shortName": "LM-Q5_K_S",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "Q5_K_S",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.010808,
|
||
|
|
"ppl": 8.919999,
|
||
|
|
"pplDeltaPercent": 0.40973254086182603,
|
||
|
|
"sizeBytes": 2823711936,
|
||
|
|
"sizeGiB": 2.6297866702079773
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "2:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-Q5_K.gguf",
|
||
|
|
"displayName": "Model-LM-Q5_K",
|
||
|
|
"shortName": "LM-Q5_K",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "Q5_K",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.009942,
|
||
|
|
"ppl": 8.896878,
|
||
|
|
"pplDeltaPercent": 0.14946643252735017,
|
||
|
|
"sizeBytes": 2889514176,
|
||
|
|
"sizeGiB": 2.691069781780243
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.0008660000000000004,
|
||
|
|
"sizeBytes": -65802240,
|
||
|
|
"sizeGiB": -0.061283111572265625,
|
||
|
|
"removedPplDeltaPercent": 0.40973254086182603,
|
||
|
|
"winnerPplDeltaPercent": 0.14946643252735017,
|
||
|
|
"pplDeltaPercentImprovement": 0.26026610833447583
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "0:1:0:7:1:2:7:15:0:0",
|
||
|
|
"fileName": "Model-MQ-Q4_K_M.gguf",
|
||
|
|
"displayName": "Model-MQ-Q4_K_M",
|
||
|
|
"shortName": "MQ-Q4_K_M",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q8_0",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.021705,
|
||
|
|
"ppl": 8.964544,
|
||
|
|
"pplDeltaPercent": 0.9111621414741836,
|
||
|
|
"sizeBytes": 2600062656,
|
||
|
|
"sizeGiB": 2.4214970469474792
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "0:1:0:3:1:2:7:7:0:0",
|
||
|
|
"fileName": "Model-MQ-Q4_K_M_1.gguf",
|
||
|
|
"displayName": "Model-MQ-Q4_K_M_1",
|
||
|
|
"shortName": "MQ-Q4_K_M_1",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q4_K_M",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.020346,
|
||
|
|
"ppl": 8.95744,
|
||
|
|
"pplDeltaPercent": 0.8311945607636608,
|
||
|
|
"sizeBytes": 2618576576,
|
||
|
|
"sizeGiB": 2.4387394785881042
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.001358999999999999,
|
||
|
|
"sizeBytes": -18513920,
|
||
|
|
"sizeGiB": -0.017242431640625,
|
||
|
|
"removedPplDeltaPercent": 0.9111621414741836,
|
||
|
|
"winnerPplDeltaPercent": 0.8311945607636608,
|
||
|
|
"pplDeltaPercentImprovement": 0.07996758071052279
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "NEAR_BASELINE_PREMIUM",
|
||
|
|
"reasonDescription": "The winner used only the configured near-baseline size premium and beat the real linear KLD trade line.",
|
||
|
|
"rawReason": "near-baseline replacement within \u002B1% size premium",
|
||
|
|
"removed": {
|
||
|
|
"key": "100:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-UD-Q4_K_XL.gguf",
|
||
|
|
"displayName": "Model-UD-Q4_K_XL",
|
||
|
|
"shortName": "UD-Q4_K_XL",
|
||
|
|
"provider": "Unsloth",
|
||
|
|
"quantFamily": "UD-Q4_K_XL",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": true,
|
||
|
|
"kld": 0.022351,
|
||
|
|
"ppl": 8.997353,
|
||
|
|
"pplDeltaPercent": 1.2804831374668026,
|
||
|
|
"sizeBytes": 2591284416,
|
||
|
|
"sizeGiB": 2.4133216738700867
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "0:1:0:7:1:2:7:15:0:0",
|
||
|
|
"fileName": "Model-MQ-Q4_K_M.gguf",
|
||
|
|
"displayName": "Model-MQ-Q4_K_M",
|
||
|
|
"shortName": "MQ-Q4_K_M",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q8_0",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.021705,
|
||
|
|
"ppl": 8.964544,
|
||
|
|
"pplDeltaPercent": 0.9111621414741836,
|
||
|
|
"sizeBytes": 2600062656,
|
||
|
|
"sizeGiB": 2.4214970469474792
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.0006460000000000007,
|
||
|
|
"sizeBytes": -8778240,
|
||
|
|
"sizeGiB": -0.008175373077392578,
|
||
|
|
"removedPplDeltaPercent": 1.2804831374668026,
|
||
|
|
"winnerPplDeltaPercent": 0.9111621414741836,
|
||
|
|
"pplDeltaPercentImprovement": 0.36932099599261903
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "100:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-UD-Q4_K_XL.gguf",
|
||
|
|
"displayName": "Model-UD-Q4_K_XL",
|
||
|
|
"shortName": "UD-Q4_K_XL",
|
||
|
|
"provider": "Unsloth",
|
||
|
|
"quantFamily": "UD-Q4_K_XL",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": true,
|
||
|
|
"kld": 0.022351,
|
||
|
|
"ppl": 8.997353,
|
||
|
|
"pplDeltaPercent": 1.2804831374668026,
|
||
|
|
"sizeBytes": 2591284416,
|
||
|
|
"sizeGiB": 2.4133216738700867
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "0:1:0:7:1:2:7:15:0:0",
|
||
|
|
"fileName": "Model-MQ-Q4_K_M.gguf",
|
||
|
|
"displayName": "Model-MQ-Q4_K_M",
|
||
|
|
"shortName": "MQ-Q4_K_M",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q8_0",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.021705,
|
||
|
|
"ppl": 8.964544,
|
||
|
|
"pplDeltaPercent": 0.9111621414741836,
|
||
|
|
"sizeBytes": 2600062656,
|
||
|
|
"sizeGiB": 2.4214970469474792
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.0006460000000000007,
|
||
|
|
"sizeBytes": -8778240,
|
||
|
|
"sizeGiB": -0.008175373077392578,
|
||
|
|
"removedPplDeltaPercent": 1.2804831374668026,
|
||
|
|
"winnerPplDeltaPercent": 0.9111621414741836,
|
||
|
|
"pplDeltaPercentImprovement": 0.36932099599261903
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "0:1:0:7:1:2:7:7:0:0",
|
||
|
|
"fileName": "Model-MQ-Q4_K_M.gguf",
|
||
|
|
"displayName": "Model-MQ-Q4_K_M",
|
||
|
|
"shortName": "MQ-Q4_K_M",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q8_0",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.023119,
|
||
|
|
"ppl": 8.965156,
|
||
|
|
"pplDeltaPercent": 0.9180512404881,
|
||
|
|
"sizeBytes": 2559594176,
|
||
|
|
"sizeGiB": 2.3838078379631042
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "100:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-UD-Q4_K_XL.gguf",
|
||
|
|
"displayName": "Model-UD-Q4_K_XL",
|
||
|
|
"shortName": "UD-Q4_K_XL",
|
||
|
|
"provider": "Unsloth",
|
||
|
|
"quantFamily": "UD-Q4_K_XL",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": true,
|
||
|
|
"kld": 0.022351,
|
||
|
|
"ppl": 8.997353,
|
||
|
|
"pplDeltaPercent": 1.2804831374668026,
|
||
|
|
"sizeBytes": 2591284416,
|
||
|
|
"sizeGiB": 2.4133216738700867
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.0007680000000000013,
|
||
|
|
"sizeBytes": -31690240,
|
||
|
|
"sizeGiB": -0.029513835906982422,
|
||
|
|
"removedPplDeltaPercent": 0.9180512404881,
|
||
|
|
"winnerPplDeltaPercent": 1.2804831374668026,
|
||
|
|
"pplDeltaPercentImprovement": -0.3624318969787026
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "3:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-Q4_K_M.gguf",
|
||
|
|
"displayName": "Model-LM-Q4_K_M",
|
||
|
|
"shortName": "LM-Q4_K_M",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "Q4_K_M",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.025432,
|
||
|
|
"ppl": 9.030426,
|
||
|
|
"pplDeltaPercent": 1.6527759016614976,
|
||
|
|
"sizeBytes": 2497281216,
|
||
|
|
"sizeGiB": 2.325774371623993
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "0:1:0:7:1:2:7:7:0:0",
|
||
|
|
"fileName": "Model-MQ-Q4_K_M.gguf",
|
||
|
|
"displayName": "Model-MQ-Q4_K_M",
|
||
|
|
"shortName": "MQ-Q4_K_M",
|
||
|
|
"provider": "MagicQuant",
|
||
|
|
"quantFamily": "Q8_0",
|
||
|
|
"isHybrid": true,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.023119,
|
||
|
|
"ppl": 8.965156,
|
||
|
|
"pplDeltaPercent": 0.9180512404881,
|
||
|
|
"sizeBytes": 2559594176,
|
||
|
|
"sizeGiB": 2.3838078379631042
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.002312999999999999,
|
||
|
|
"sizeBytes": -62312960,
|
||
|
|
"sizeGiB": -0.05803346633911133,
|
||
|
|
"removedPplDeltaPercent": 1.6527759016614976,
|
||
|
|
"winnerPplDeltaPercent": 0.9180512404881,
|
||
|
|
"pplDeltaPercentImprovement": 0.7347246611733975
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "5:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-IQ4_NL.gguf",
|
||
|
|
"displayName": "Model-LM-IQ4_NL",
|
||
|
|
"shortName": "LM-IQ4_NL",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "IQ4_NL",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.030626,
|
||
|
|
"ppl": 8.946429,
|
||
|
|
"pplDeltaPercent": 0.7072470620018989,
|
||
|
|
"sizeBytes": 2381343936,
|
||
|
|
"sizeGiB": 2.2177993655204773
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "14:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-Q4_K_S.gguf",
|
||
|
|
"displayName": "Model-LM-Q4_K_S",
|
||
|
|
"shortName": "LM-Q4_K_S",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "Q4_K_S",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.029803,
|
||
|
|
"ppl": 9.010033,
|
||
|
|
"pplDeltaPercent": 1.4232180647485306,
|
||
|
|
"sizeBytes": 2383310016,
|
||
|
|
"sizeGiB": 2.2196304202079773
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.0008230000000000008,
|
||
|
|
"sizeBytes": -1966080,
|
||
|
|
"sizeGiB": -0.0018310546875,
|
||
|
|
"removedPplDeltaPercent": 0.7072470620018989,
|
||
|
|
"winnerPplDeltaPercent": 1.4232180647485306,
|
||
|
|
"pplDeltaPercentImprovement": -0.7159710027466317
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "8:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-IQ3_XS.gguf",
|
||
|
|
"displayName": "Model-LM-IQ3_XS",
|
||
|
|
"shortName": "LM-IQ3_XS",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "IQ3_XS",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.11761,
|
||
|
|
"ppl": 9.485851,
|
||
|
|
"pplDeltaPercent": 6.779357467693287,
|
||
|
|
"sizeBytes": 1814375616,
|
||
|
|
"sizeGiB": 1.6897689700126648
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "7:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-IQ3_S.gguf",
|
||
|
|
"displayName": "Model-LM-IQ3_S",
|
||
|
|
"shortName": "LM-IQ3_S",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "IQ3_S",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.091992,
|
||
|
|
"ppl": 9.349099,
|
||
|
|
"pplDeltaPercent": 5.239981539015728,
|
||
|
|
"sizeBytes": 1899531456,
|
||
|
|
"sizeGiB": 1.7690765261650085
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.025618000000000002,
|
||
|
|
"sizeBytes": -85155840,
|
||
|
|
"sizeGiB": -0.07930755615234375,
|
||
|
|
"removedPplDeltaPercent": 6.779357467693287,
|
||
|
|
"winnerPplDeltaPercent": 5.239981539015728,
|
||
|
|
"pplDeltaPercentImprovement": 1.5393759286775586
|
||
|
|
}
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"reasonCode": "SPACING_COLLAPSE",
|
||
|
|
"reasonDescription": "Two candidates were too close in practical output space; the stronger one was kept.",
|
||
|
|
"rawReason": "meaningful spacing collapse; size gap below 91,013,530 bytes",
|
||
|
|
"removed": {
|
||
|
|
"key": "11:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-IQ2_XS.gguf",
|
||
|
|
"displayName": "Model-LM-IQ2_XS",
|
||
|
|
"shortName": "LM-IQ2_XS",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "IQ2_XS",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.529564,
|
||
|
|
"ppl": 13.498521,
|
||
|
|
"pplDeltaPercent": 51.94877076860733,
|
||
|
|
"sizeBytes": 1354100416,
|
||
|
|
"sizeGiB": 1.2611042857170105
|
||
|
|
},
|
||
|
|
"winner": {
|
||
|
|
"key": "10:0:0:0:0:0:0:0:0:0",
|
||
|
|
"fileName": "Model-LM-IQ2_S.gguf",
|
||
|
|
"displayName": "Model-LM-IQ2_S",
|
||
|
|
"shortName": "LM-IQ2_S",
|
||
|
|
"provider": "llama.cpp",
|
||
|
|
"quantFamily": "IQ2_S",
|
||
|
|
"isHybrid": false,
|
||
|
|
"isExternalPureBaseline": false,
|
||
|
|
"kld": 0.431128,
|
||
|
|
"ppl": 12.334448,
|
||
|
|
"pplDeltaPercent": 38.84515286595525,
|
||
|
|
"sizeBytes": 1417301696,
|
||
|
|
"sizeGiB": 1.3199650645256042
|
||
|
|
},
|
||
|
|
"deltas": {
|
||
|
|
"kld": 0.09843600000000002,
|
||
|
|
"sizeBytes": -63201280,
|
||
|
|
"sizeGiB": -0.05886077880859375,
|
||
|
|
"removedPplDeltaPercent": 51.94877076860733,
|
||
|
|
"winnerPplDeltaPercent": 38.84515286595525,
|
||
|
|
"pplDeltaPercentImprovement": 13.103617902652083
|
||
|
|
}
|
||
|
|
}
|
||
|
|
]
|