初始化项目，由ModelHub XC社区提供模型

Model: eaddario/granite-4.1-8b-GGUF Source: Original Platform
2026-06-14 00:38:20 +08:00
commit a947aa221e
80 changed files with 12432 additions and 0 deletions
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,38 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+*.gguf filter=lfs diff=lfs merge=lfs -text
+*.logits filter=lfs diff=lfs merge=lfs -text
+*.dat filter=lfs diff=lfs merge=lfs -text
+*.bpw_state filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
--- a/.gitignore
+++ b/.gitignore
@@ -0,0 +1,584 @@
+# https://github.com/github/gitignore
+
+# -------------
+# General Linux
+# -------------
+.directory
+.fuse_hidden*
+.nfs*
+.Trash-*
+*~
+
+# -----------
+# General OSX
+# -----------
+._*
+.apdisk
+.AppleDB
+.AppleDesktop
+.AppleDouble
+.com.apple.timemachine.donotpresent
+.DocumentRevisions-V100
+.DS_Store
+.fseventsd
+.LSOverride
+.Spotlight-V100
+.TemporaryItems
+.Trashes
+.VolumeIcon.icns
+Network Trash Folder
+Temporary Items
+
+# ---------------
+# General Windows
+# ---------------
+[Dd]esktop.ini
+*.cab
+*.lnk
+*.msi
+*.msix
+*.msm
+*.msp
+*.stackdump
+$RECYCLE.BIN/
+ehthumbs_vista.db
+ehthumbs.db
+Thumbs.db
+Thumbs.db:encryptable
+
+# -----------------
+# General JetBrains
+# -----------------
+.idea_modules/
+.idea/
+*.iml
+*.ipr
+*.iws
+
+# ---------------
+# General VS Code
+# ---------------
+!.vscode/*.code-snippets
+!.vscode/extensions.json
+!.vscode/launch.json
+!.vscode/settings.json
+!.vscode/tasks.json
+.history/
+.vscode/
+*.vsix
+
+# ---------------------
+# General Visual Studio
+# ---------------------
+__pycache__/
+_NCrunch_*
+_pkginfo.txt
+_Pvt_Extensions
+_ReSharper*/
+_TeamCity*
+_UpgradeReport_Files/
+!?*.[Cc]ache/
+!.vscode/extensions.json
+!**/[Pp]ackages/build/
+.*crunch*.local.xml
+.builds
+.cr/personal
+.fake/
+.ionide/
+.localhistory/
+.mfractor/
+.ntvs_analysis.dat
+.paket/paket.exe
+.sass-cache/
+.vs/
+.vscode/*
+.vshistory/
+[Aa][Rr][Mm]/
+[Aa][Rr][Mm]64/
+[Bb]in/
+[Bb]uild[Ll]og.*
+[Dd]ebug/
+[Dd]ebugPS/
+[Dd]ebugPublic/
+[Ee]xpress/
+[Ll]og/
+[Ll]ogs/
+[Oo]bj/
+[Rr]elease/
+[Rr]eleasePS/
+[Rr]eleases/
+[Tt]est[Rr]esult*/
+[Ww][Ii][Nn]32/
+*_h.h
+*_i.c
+*_p.c
+*_wpftmp.csproj
+*- [Bb]ackup ([0-9]).rdl
+*- [Bb]ackup ([0-9][0-9]).rdl
+*- [Bb]ackup.rdl
+*.[Cc]ache
+*.[Pp]ublish.xml
+*.[Rr]e[Ss]harper
+*.appx
+*.appxbundle
+*.appxupload
+*.aps
+*.azurePubxml
+*.bim_*.settings
+*.bim.layout
+*.binlog
+*.btm.cs
+*.btp.cs
+*.build.csdef
+*.cachefile
+*.code-workspace
+*.coverage
+*.coveragexml
+*.dbmdl
+*.dbproj.schemaview
+*.dotCover
+*.DotSettings.user
+*.dsp
+*.dsw
+*.e2e
+*.GhostDoc.xml
+*.gpState
+*.ilk
+*.iobj
+*.ipdb
+*.jfm
+*.jmconfig
+*.ldf
+*.mdf
+*.meta
+*.mm.*
+*.ncb
+*.ndf
+*.nuget.props
+*.nuget.targets
+*.nupkg
+*.nvuser
+*.obj
+*.odx.cs
+*.opendb
+*.opensdf
+*.opt
+*.pch
+*.pdb
+*.pfx
+*.pgc
+*.pgd
+*.pidb
+*.plg
+*.psess
+*.publishproj
+*.publishsettings
+*.pubxml
+*.pyc
+*.rdl.data
+*.rptproj.bak
+*.rptproj.rsuser
+*.rsp
+*.rsuser
+*.sap
+*.sbr
+*.scc
+*.sdf
+*.sln.docstates
+*.sln.iml
+*.snupkg
+*.suo
+*.svclog
+*.tlb
+*.tlh
+*.tli
+*.tlog
+*.tmp
+*.tmp_proj
+*.tss
+*.user
+*.userosscache
+*.userprefs
+*.vbp
+*.vbw
+*.VC.db
+*.VC.VC.opendb
+*.VisualState.xml
+*.vsp
+*.vspscc
+*.vspx
+*.vssscc
+*.xsd.cs
+**/[Pp]ackages/*
+**/*.DesktopClient/GeneratedArtifacts
+**/*.DesktopClient/ModelManifest.xml
+**/*.HTMLClient/GeneratedArtifacts
+**/*.Server/GeneratedArtifacts
+**/*.Server/ModelManifest.xml
+~$*
+$tf/
+AppPackages/
+artifacts/
+ASALocalRun/
+AutoTest.Net/
+Backup*/
+BenchmarkDotNet.Artifacts/
+bld/
+BundleArtifacts/
+ClientBin/
+coverage*.info
+coverage*.json
+coverage*.xml
+csx/
+dlldata.c
+DocProject/buildhelp/
+DocProject/Help/*.hhc
+DocProject/Help/*.hhk
+DocProject/Help/*.hhp
+DocProject/Help/*.HxC
+DocProject/Help/*.HxT
+DocProject/Help/html
+DocProject/Help/Html2
+ecf/
+FakesAssemblies/
+FodyWeavers.xsd
+Generated_Code/
+healthchecksdb
+ipch/
+MigrationBackup/
+mono_crash.*
+nCrunchTemp_*
+node_modules/
+nunit-*.xml
+OpenCover/
+orleans.codegen.cs
+Package.StoreAssociation.xml
+paket-files/
+project.fragment.lock.json
+project.lock.json
+publish/
+PublishScripts/
+rcf/
+ScaffoldingReadMe.txt
+ServiceFabricBackup/
+StyleCopReport.xml
+TestResult.xml
+UpgradeLog*.htm
+UpgradeLog*.XML
+x64/
+x86/
+
+# ----------------------
+# General Archived Files
+# ----------------------
+*.7z
+*.bz2
+*.bzip
+*.bzip2
+*.deb
+*.dmg
+*.egg
+*.gem
+*.gz
+*.gzip
+*.iso
+*.jar
+*.lzma
+*.rar
+*.rpm
+*.tar
+*.tgz
+*.txz
+*.tzst
+*.xar
+*.xpi
+*.xz
+*.zip
+*.zst
+
+# -----
+# C/C++
+# -----
+.tmp_versions/
+*.a
+*.app
+*.cmd
+*.d
+*.dll
+*.dSYM/
+*.dylib
+*.elf
+*.exe
+*.exp
+*.gch
+*.hex
+*.i*86
+*.idb
+*.ko
+*.la
+*.lai
+*.lib
+*.lo
+*.map
+*.mod*
+*.o
+*.out
+*.slo
+*.so
+*.so.*
+*.su
+*.x86_64
+dkms.conf
+Mkfile.old
+Module.symvers
+modules.order
+
+# ----
+# CUDA
+# ----
+*.cubin
+*.fatbin
+*.gpu
+*.i
+*.ii
+*.ptx
+
+# --
+# Go
+# --
+.env
+*.exe~
+*.test
+go.work
+go.work.sum
+
+# ----
+# Java
+# ----
+*.class
+*.ctxt
+*.ear
+*.hprof
+*.nar
+*.tar.gz
+*.war
+hs_err_pid*
+replay_pid*
+
+# -----
+# Julia
+# -----
+*.jl.*.cov
+*.jl.cov
+*.jl.mem
+deps/build.log
+deps/deps.jl
+deps/downloads/
+deps/src/
+deps/usr/
+docs/build/
+docs/site/
+Manifest.toml
+
+# ------------------------------
+# JavaScript / Node / TypeScript
+# ------------------------------
+.cache
+.cache/
+.docusaurus
+.dynamodb/
+.env.development.local
+.env.local
+.env.production.local
+.env.test.local
+.eslintcache
+.fusebox/
+.grunt
+.lock-wscript
+.next
+.node_repl_history
+.npm
+.nuxt
+.nyc_output
+.parcel-cache
+.pnp.*
+.pnpm-debug.log*
+.rpt2_cache/
+.rts2_cache_cjs/
+.rts2_cache_es/
+.rts2_cache_umd/
+.serverless/
+.stylelintcache
+.temp
+.tern-port
+.vscode-test
+.vuepress/dist
+.yarn-integrity
+.yarn/build-state.yml
+.yarn/cache
+.yarn/install-state.gz
+.yarn/unplugged
+*.lcov
+*.pid
+*.pid.lock
+*.seed
+*.tsbuildinfo
+bower_components
+dist
+jspm_packages/
+lerna-debug.log*
+lib-cov
+logs
+npm-debug.log*
+out
+pids
+report.[0-9]*.[0-9]*.[0-9]*.[0-9]*.json
+web_modules/
+yarn-debug.log*
+yarn-error.log*
+
+# ------
+# Python
+# ------
+__pypackages__/
+.coverage
+.coverage.*
+.dmypy.json
+.eggs/
+.hypothesis/
+.installed.cfg
+.ipynb_checkpoints
+.mypy_cache/
+.nox/
+.pdm-build/
+.pdm-python
+.pdm.toml
+.pybuilder/
+.pyre/
+.pytest_cache/
+.Python
+.python-version
+.pytype/
+.ropeproject
+.scrapy
+.spyderproject
+.spyproject
+.tox/
+.venv
+.webassets-cache
+*.cover
+*.egg-info/
+*.manifest
+*.mo
+*.pot
+*.py,cover
+*.py[cod]
+*.sage.py
+*.spec
+*$py.class
+/site
+build/
+celerybeat-schedule
+celerybeat.pid
+cover/
+coverage.xml
+cython_debug/
+db.sqlite3
+db.sqlite3-journal
+develop-eggs/
+dist/
+dmypy.json
+docs/_build/
+downloads/
+eggs/
+env.bak/
+env/
+htmlcov/
+instance/
+ipython_config.py
+lib/
+lib64/
+local_settings.py
+MANIFEST
+nosetests.xml
+parts/
+pip-delete-this-directory.txt
+pip-log.txt
+profile_default/
+sdist/
+share/python-wheels/
+target/
+var/
+venv.bak/
+venv/
+wheels/
+
+# ----
+# Rust
+# ----
+**/*.rs.bk
+Cargo.lock
+debug/
+
+# -----
+# Scala
+# -----
+
+# -----
+# CMake
+# -----
+_deps
+cmake_install.cmake
+CMakeCache.txt
+CMakeFiles
+CMakeLists.txt.user
+CMakeScripts
+CMakeUserPresets.json
+compile_commands.json
+CTestTestfile.cmake
+install_manifest.txt
+Makefile
+Testing
+
+# ------
+# Gradle
+# ------
+!gradle-wrapper.jar
+!gradle-wrapper.properties
+!src/**/build/
+.classpath
+.gradle
+.gradletasknamecache
+.project
+**/build/
+gradle-app.setting
+
+# -----
+# Maven
+# -----
+.mvn/
+buildNumber.properties
+dependency-reduced-pom.xml
+pom.xml.next
+pom.xml.releaseBackup
+pom.xml.tag
+pom.xml.versionsBackup
+release.properties
+
+# ---------
+# Terraform
+# ---------
+.terraform.tfstate.lock.info
+.terraform/
+.terraformrc
+*_override.tf
+*_override.tf.json
+*.tfstate
+*.tfstate.*
+*.tfvars
+*.tfvars.json
+crash.*.log
+crash.log
+override.tf
+override.tf.json
+terraform.rc
--- a/Granite_4.1_8b-6f6fd2708e8b1ded.bpw_state
+++ b/Granite_4.1_8b-6f6fd2708e8b1ded.bpw_state
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6ab793fef9b02f0b52d04ae0a0bc046d75406ba58d9291b3439fbc5f1f0519fe
+size 99424
--- a/README.md
+++ b/README.md
@@ -0,0 +1,238 @@
+---
+base_model:
+- ibm-granite/granite-4.1-8b
+datasets:
+- eaddario/imatrix-calibration
+language:
+- en
+license:
+- apache-2.0
+pipeline_tag: text-generation
+tags:
+- gguf
+- quant
+- target_bpw
+- experimental
+---
+
+# Experimental global target bits‑per‑weight quantization of [ibm-granite/granite-4.1-8b](https://huggingface.co/ibm-granite/granite-4.1-8b)
+Using **non-standard** (forked) [LLaMA C++][llm] release [b9358][llm-rel] for quantization.
+
+Original model: [ibm-granite/granite-4.1-8b][mdl]
+
+From the original model creators:
+> [![mof-class3-qualified](https://mot.isitopen.ai/modules/mof/assets/badge_class3_qualified.png)](https://mot.isitopen.ai/model/1160)
+>
+> # Granite-4.1-8B
+>
+> **Model Summary:**
+> Granite-4.1-8B is a 8B parameter long-context instruct model finetuned from *Granite-4.1-8B-Base* using a combination of open source instruction datasets with permissive license and internally collected synthetic datasets. Granite 4.1 models have gone through an improved post-training pipeline, including supervised finetuning and reinforcement learning alignment, resulting in enhanced tool calling, instruction following, and chat capabilities.
+>
+> - **Developers:** Granite Team, IBM
+> - **HF Collection:** [Granite 4.1 Language Models HF Collection](https://huggingface.co/collections/ibm-granite/granite-41-language-models)
+> - **Technical Blog:** [Granite-4.1 Blog](https://huggingface.co/blog/ibm-granite/granite-4-1)
+> - **GitHub Repository:** [ibm-granite/granite-4.1-language-models](https://github.com/ibm-granite/granite-4.1-language-models)
+> - **Website**: [Granite Docs](https://www.ibm.com/granite/docs/) 
+> - **Release Date**: April 29th, 2026
+> - **License:** [Apache 2.0](https://www.apache.org/licenses/LICENSE-2.0)
+>
+> **Supported Languages:** 
+> English, German, Spanish, French, Japanese, Portuguese, Arabic, Czech, Italian, Korean, Dutch, and Chinese. Users may finetune Granite 4.1 models for languages beyond these languages.
+>
+> **Intended use:** 
+> The model is designed to follow general instructions and can serve as the foundation for AI assistants across diverse domains, including business applications, as well as for LLM agents equipped with tool-use capabilities.
+
+---
+
+# ⚠️ PLEASE READ THIS BEFORE USING THESE EXPERIMENTAL VERSIONS! ⚠️
+An area of personal interest is finding ways to optimize the inference performance of LLMs when deployed in resource-constrained environments like commodity hardware, desktops, laptops, mobiles, edge devices, etc. There are many approaches to accomplish this, including architecture simplification and knowledge distillation, but my focus has been primarily on quantization and pruning.
+
+The method to produce these experimental versions involves using a custom version of [`llama-imatrix`][imx] to generate an imatrix that includes tensor statistics, and a custom version of [`llama-quantize`][qtz], which computes a per-tensor quantization error, to automatically select the lowest error quantization recipe that achieves a global target bits‑per‑weight (bpw). More details on the implementation and test results [here][bpw]
+
+There are two pull requests ([#14891][imtx-pr] & [#15550][qtz-pr]) to merge these changes back into the core llama.cpp project. This may or may not ever happen so, until then, the modified versions will be available on [GitHub][gh].
+
+For testing and comparison, I use models produced by [Bartowski][btk] (see credits below) and [Unsloth][ust] ([Daniel and Michael Han][ust-ai] do some really interesting stuff!) but when they don't provide versions of the required model, tests and comparisons are against standard quantization obtained by simply running `llama-quantize` with no further optimizations.
+
+All experimental versions were generated using an appropriate imatrix created from datasets available at [eaddario/imatrix-calibration][ical]. In `llama.cpp`, an imatrix is a calibration file derived from running representative text through the model and collecting activation statistics. It is used to weight quantization error so that error in more “important” directions (as estimated from activations) is penalized more heavily.
+
+The process to generate these models is roughly as follows:
+1. Convert the original model's [safetensors][sfts] to [GGUF][ggf] F16
+2. Estimate the [Perplexity][ppl] score for the F16 model (baseline) using the [wikitext-2-raw-v1][wki-dat] dataset, and save the [logits][lgt]
+3. Generate an [imatrix][imx-dat] from the most appropriate [calibration dataset][ical]
+4. Quantize the baseline model targeting a bpw average (e.g. `llama-quantize --target-bpw 4.5678 --state-file --imatrix imatrix.gguf baseline-model-F16.gguf 12`)
+5. Calculate Perplexity, KL Divergence, ARC (Easy+Challenge), GPQA-Diamond, HellaSwag, MMLU-Redux, Truthful QA and WinoGrande scores for each quantized model
+6. Keep version with the best 𝜌PPL and μKLD scores
+7. Repeat until all desired quants are created
+
+### Misconceptions about BF16 to F16 Conversion
+A common concern when converting BFloat16 ([BF16][bf16]) models to Float16 (F16) is the potential for accuracy loss. Specifically:
+- Weight Clipping (Overflow): Clipping, or overflow, is often feared but only occurs if a model's weights exceed the range of ±65,503. This is a relatively rare issue in practice.
+- Subnormal Zeroing (Underflow): A more frequent occurrence is underflow, where weights smaller than approximately 5.96x10⁻⁸ are converted to zero.
+
+Crucially, when the F16 model is subsequently used for quantization, the resulting degradation in metrics like Perplexity ([PPL][ppl]) or Kullback–Leibler Divergence ([KLD][kld]) is minimal. Any variations are typically restricted to the hundreds or thousandths decimal places compared to the BF16 model.
+
+However, considering that weight clipping presents a more substantial risk to model integrity, every BF16 base model undergoes validation prior to the conversion process. Consequently, no models hosted in this repository exhibit performance degradation due to overflow clipping.
+
+While BF16 offers precision benefits, performance remains a key factor.
+- Conversion Speed: Tests, such as timing `convert_hf_to_gguf.py`, show a notable performance difference, with conversion to BF16 being 15–30% slower than to F16.
+- Inference Speed: A less pronounced but still present difference (3–6%) is observed during inference. Although native BF support has been introduced by many chip manufacturers, the slower performance **may** stem from the entire software and hardware stack (firmware, libraries, etc.) not being fully optimized yet.
+
+The choice to prioritize F16 over BF16 is driven by a focus on maximizing performance in specific deployment environments. My primary objective is not large-scale quantization production, a domain where others like [Bartowski][btk] and [Unsloth][ust] excel at, but rather optimizing inference performance for resource-constrained environments. Since BF16 support is not yet widespread in areas like mobile, edge, and embedded devices, using F16 ensures broader compatibility and easier optimization for these use cases.
+
+# Advantages and disadvantages of the global target bits‑per‑weight quantization process
+### Advantages
+1. **Target arbitrary size models**
+    - When specifying `--target-bpw 4.5678` for instance, the algorithm will produce a model (nearly) exactly of that size, which is very useful for maximizing VRAM usage. In a system with 24GB VRAM and a 70B model, standard quants might produce a 16.8GB file (too small, quality left on table) or a 24.1GB file (won't fit). This approach can generate a 23.85GB file to utilize the hardware fully.
+
+2. **Data-driven mixed precision often can improve quality at fixed size**
+    - Instead of using hardcoded heuristics (e.g. make `attn_v` Q5_K for a 70B model), that may be sub‑optimal for a given architecture or size, the quantization mix is determined by the actual error sensitivity of the specific model's weights. This, in practice, often yields a better quality/size trade-off, especially in aggressive quantization scenarios (1.5 to 3.5 bpw), or for unusual architectures.
+
+    - **Please note**: `llama.cpp`’s heuristics have been tuned across many models and are highly optimized; although the target bpw method produces better quality often (>75% based on tests with 130 models from 11 different families), it can also lose in surprising cases.
+
+3. **Allows better like-for-like comparisons between models and families**
+    - Standard `llama.cpp` quantization uses hardcoded rules like: *"use Q4_K_M, except bump some tensors up/down, except fall back if incompatible, except keep some tensors unquantized..."* and for that reason, two different models quantized with the same Q4_K_M type can end up with very different bpw (e.g. 4.75 and 4.30).
+
+    - All things being equal, the performance of a model is usually proportional to its overall bpw size; models with a higher bpw tend to perform better than lower bpw models. Since model A has simply been given more bits, it will typically perform better (lower perplexity, better eval scores, etc.) even if the underlying quantization method is identical. That makes comparing the performance not a controlled experiment, because the comparison is between models with different effective compression ratios.
+
+    - `--target-bpw` tries to address that by making the experiment more controlled: each model gets quantized to land on (approximately) the same global byte budget, so that the models' performance differences are more attributable to architecture/training differences, quantization error behaviour at the same compression ratio, optimizer’s allocation decisions, etc.
+
+### Disadvantages
+1. **Quantization process is significantly slower than standard**
+    - This approach can take 5x-10x longer as it quantizes a sample of most tensors into 15 different formats, dequantizes them back to floats, computes error diffs, and selects the best size/error option that fits the global bpw budget.
+
+    - However, the `--state-file` option will save/use the above-mentioned computations so that future quantizations, for the same model, can be generated at normal speed. It also allows to interrupt the computation process and resume it at a later time.
+
+2. **The optimization target is only a proxy for the model's performance quality**
+    - The process minimizes a per-tensor estimated error computed from sampled rows, not actual perplexity or divergence of output distributions (a future version may address this). Since errors interact nonlinearly across layers, there are no guarantees it will select the best possible quantization recipe subject to the bpw size constraint.
+
+3. **An imatrix with activations data is required for best results**
+    - Activation data is required to compute the bias factor (i.e. the systematic error projected onto activation directions). If the imatrix file does not contain activation data, the `--target-bpw` option will refuse to run.
+
+---
+
+# Models
+### Bits per weight, size, perplexity and KL Divergence scores
+| Model                                             |     BPW | Size (GB) |                μPPL |   𝜌PPL |               μKLD |    Same Top-P |
+| ------------------------------------------------- | ------: | --------: | ------------------: | -----: | -----------------: | ------------: |
+| [granite-4.1-8b-F16](./granite-4.1-8b-F16.gguf)   | 16.0006 |      17.6 |  8.691178 ±0.065443 |   100% |                N/A |           N/A |
+| [granite-4.1-8b-Q2_K](./granite-4.1-8b-Q1_L.gguf) |  1.7500 |      1.93 | 87.318832 ±0.781580 | 57.61% | 2.889523 ±0.005948 | 34.309 ±0.125 |
+| [granite-4.1-8b-Q2_K](./granite-4.1-8b-Q2_K.gguf) |  2.5000 |      2.75 | 12.534216 ±0.095606 | 86.12% | 0.644965 ±0.002755 | 67.231 ±0.124 |
+| [granite-4.1-8b-Q3_K](./granite-4.1-8b-Q3_K.gguf) |  3.5000 |      3.85 |  9.381594 ±0.070128 | 96.18% | 0.173887 ±0.001079 | 82.732 ±0.100 |
+| [granite-4.1-8b-Q4_K](./granite-4.1-8b-Q4_K.gguf) |  4.4999 |      4.95 |  8.867438 ±0.067303 | 98.88% | 0.047917 ±0.000392 | 90.937 ±0.076 |
+| [granite-4.1-8b-Q5_K](./granite-4.1-8b-Q5_K.gguf) |  5.4999 |      6.05 |  8.766150 ±0.066421 | 99.48% | 0.018940 ±0.000165 | 94.120 ±0.062 |
+| [granite-4.1-8b-Q6_K](./granite-4.1-8b-Q6_K.gguf) |  6.4998 |      7.15 |  8.755199 ±0.066400 | 99.74% | 0.007326 ±0.000066 | 96.165 ±0.051 |
+| [granite-4.1-8b-Q7_K](./granite-4.1-8b-Q7_K.gguf) |  7.4998 |      8.25 |  8.751241 ±0.066500 | 99.82% | 0.003568 ±0.000040 | 97.235 ±0.043 |
+| [granite-4.1-8b-Q8_0](./granite-4.1-8b-Q8_0.gguf) |  8.4988 |      9.34 |  8.749119 ±0.066517 | 99.85% | 0.002052 ±0.000024 | 97.749 ±0.039 |
+
+### ARC, GPQA-Diamond, HellaSwag, MMLU-Redux, Truthful QA, and WinoGrande scores
+Scores generated using [llama-perplexity][ppl] with 750 tasks per test, and a context size of 1024 tokens.
+
+For the test data used in the generation of these scores, follow the appropriate links: [ARC Challenge, Truthful QA][tst-dat], [GPQA-Diamond][gpqa-dat], [HellaSwag][hsw-tst], [MMLU-Redux][mrdx], [WinoGrande][wng-tst]
+
+| Model                                             |   ARC Challenge |    GPQA-Diamond | HellaSwag |      MMLU-Redox |     Truthful QA |      WinoGrande | Avg Score |
+| ------------------------------------------------- | --------------: | --------------: | --------: | --------------: | --------------: | --------------: | --------: |
+| [granite-4.1-8b-Q1_L](./granite-4.1-8b-Q1_L.gguf) | 36.5333 ±1.7594 | 19.1919 ±2.8058 |     36.00 | 27.2000 ±1.6260 | 28.9333 ±1.6569 | 52.5333 ±1.8246 |     33.40 |
+| [granite-4.1-8b-Q2_K](./granite-4.1-8b-Q2_K.gguf) | 60.4000 ±1.7870 | 29.7980 ±3.2586 |     70.00 | 59.2000 ±1.7958 | 33.4667 ±1.7242 | 65.2000 ±1.7405 |     53.01 |
+| [granite-4.1-8b-Q3_K](./granite-4.1-8b-Q3_K.gguf) | 62.0000 ±1.7736 | 21.7172 ±2.9377 |     79.33 | 69.2000 ±1.6869 | 39.6000 ±1.7870 | 71.7333 ±1.6453 |     57.26 |
+| [granite-4.1-8b-Q4_K](./granite-4.1-8b-Q4_K.gguf) | 66.9333 ±1.7190 | 23.2323 ±3.0089 |     79.73 | 71.4667 ±1.6500 | 38.9333 ±1.7816 | 73.4667 ±1.6132 |     58.96 |
+| [granite-4.1-8b-Q5_K](./granite-4.1-8b-Q5_K.gguf) | 66.4000 ±1.7259 | 22.7273 ±2.9858 |     79.87 | 72.1333 ±1.6382 | 38.5333 ±1.7783 | 73.4667 ±1.6132 |     58.86 |
+| [granite-4.1-8b-Q6_K](./granite-4.1-8b-Q6_K.gguf) | 67.0667 ±1.7172 | 24.7475 ±3.0746 |     80.13 | 72.6667 ±1.6284 | 38.2667 ±1.7759 | 73.7333 ±1.6080 |     59.44 |
+| [granite-4.1-8b-Q7_K](./granite-4.1-8b-Q7_K.gguf) | 66.4000 ±1.7259 | 26.7677 ±3.1544 |     80.27 | 72.1333 ±1.6382 | 38.5333 ±1.7783 | 73.6000 ±1.6106 |     59.62 |
+| [granite-4.1-8b-Q8_0](./granite-4.1-8b-Q8_0.gguf) | 66.8000 ±1.7207 | 26.7677 ±3.1544 |     80.53 | 72.4000 ±1.6334 | 38.4000 ±1.7771 | 73.2000 ±1.6184 |     59.68 |
+
+### Tokens per second benchmarks
+Scores generated using [llama-bench][bch]. Standard (`llama-quantize` with no optimization) Q4_K_M quantization included for comparison.
+
+| model                                             |     size | params | backend  | threads |          test |           t/s |
+| ------------------------------------------------- | -------: | -----: | -------- | ------: | ------------: | ------------: |
+| [granite-4.1-8b-Q1_L](./granite-4.1-8b-Q1_L.gguf) | 1.79 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 |  783.11 ±0.52 |
+| [granite-4.1-8b-Q1_L](./granite-4.1-8b-Q1_L.gguf) | 1.79 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   68.68 ±0.17 |
+| [granite-4.1-8b-Q1_L](./granite-4.1-8b-Q1_L.gguf) | 1.79 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |  108.35 ±1.28 |
+| [granite-4.1-8b-Q2_K](./granite-4.1-8b-Q2_K.gguf) | 2.56 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 | 728.97 ±10.22 |
+| [granite-4.1-8b-Q2_K](./granite-4.1-8b-Q2_K.gguf) | 2.56 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   68.76 ±0.21 |
+| [granite-4.1-8b-Q2_K](./granite-4.1-8b-Q2_K.gguf) | 2.56 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |  108.98 ±0.24 |
+| [granite-4.1-8b-Q3_K](./granite-4.1-8b-Q3_K.gguf) | 3.58 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 |  733.45 ±9.51 |
+| [granite-4.1-8b-Q3_K](./granite-4.1-8b-Q3_K.gguf) | 3.58 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   63.63 ±1.20 |
+| [granite-4.1-8b-Q3_K](./granite-4.1-8b-Q3_K.gguf) | 3.58 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |   94.51 ±1.15 |
+| [granite-4.1-8b-Q4_K](./granite-4.1-8b-Q4_K.gguf) | 4.61 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 |  771.63 ±0.97 |
+| [granite-4.1-8b-Q4_K](./granite-4.1-8b-Q4_K.gguf) | 4.61 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   66.33 ±1.24 |
+| [granite-4.1-8b-Q4_K](./granite-4.1-8b-Q4_K.gguf) | 4.61 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |  105.98 ±4.76 |
+| [granite-4.1-8b-Q5_K](./granite-4.1-8b-Q5_K.gguf) | 5.63 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 | 673.26 ±34.19 |
+| [granite-4.1-8b-Q5_K](./granite-4.1-8b-Q5_K.gguf) | 5.63 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   51.29 ±3.09 |
+| [granite-4.1-8b-Q5_K](./granite-4.1-8b-Q5_K.gguf) | 5.63 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |   83.45 ±2.31 |
+| [granite-4.1-8b-Q6_K](./granite-4.1-8b-Q6_K.gguf) | 6.65 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 | 703.41 ±23.92 |
+| [granite-4.1-8b-Q6_K](./granite-4.1-8b-Q6_K.gguf) | 6.65 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   52.12 ±1.38 |
+| [granite-4.1-8b-Q6_K](./granite-4.1-8b-Q6_K.gguf) | 6.65 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |   87.04 ±0.22 |
+| [granite-4.1-8b-Q7_K](./granite-4.1-8b-Q7_K.gguf) | 7.68 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 |  614.53 ±0.48 |
+| [granite-4.1-8b-Q7_K](./granite-4.1-8b-Q7_K.gguf) | 7.68 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   49.47 ±0.59 |
+| [granite-4.1-8b-Q7_K](./granite-4.1-8b-Q7_K.gguf) | 7.68 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |   83.45 ±0.24 |
+| [granite-4.1-8b-Q8_0](./granite-4.1-8b-Q8_0.gguf) | 8.70 GiB | 8.79 B | BLAS,MTL |      12 |         pp512 |  800.32 ±0.73 |
+| [granite-4.1-8b-Q8_0](./granite-4.1-8b-Q8_0.gguf) | 8.70 GiB | 8.79 B | BLAS,MTL |      12 |         tg128 |   46.66 ±0.04 |
+| [granite-4.1-8b-Q8_0](./granite-4.1-8b-Q8_0.gguf) | 8.70 GiB | 8.79 B | BLAS,MTL |      12 | pp1024+tg1024 |   77.87 ±0.30 |
+
+# Metrics used
+**[Perplexity][ppx]:** one of the key metrics used in NLP evaluation. It measures the quality of a language model by evaluating how well it predicts the next token given a particular sequence of words. A PPL of **1** indicates an exact match between predicted and actual, whereas values greater than one indicate a degree of "surprise" the generated token differs from the expected.
+
+**[Kullback–Leibler (KL) Divergence][kld]:** a statistical measure of how much a probability distribution differs from another. When quantizing models (or altering the original tensors in any way for that matter), the closest we can preserve the weights' probability distribution to the original model the better, thus the closest to **0** the better.
+
+**[AI2 Reasoning Challenge (ARC)][arc]:** a benchmark to evaluate the ability of AI models to answer complex science questions that require logical reasoning beyond pattern matching.
+
+**[GPQA-Diamond][gpqa]:** a challenging dataset of 448 multiple-choice questions written by domain experts in biology, physics, and chemistry.
+
+**[HellaSwag][hsw]:** the Harder Endings, Longer contexts, and Low-shot Activities for Situations With Adversarial Generations (bit of a mouthful!) is a benchmark designed to test commonsense natural language inference. It requires the model to predict the most likely ending of a sentence.
+
+**[MMLU][mmlu]:** the Massive Multitask Language Understanding evaluates LLMs’ general knowledge and problem-solving abilities across 57 subjects, including elementary mathematics, US history, computer science, and law.
+
+**[Truthful QA][tqa]:** evaluates how well LLMs generate truthful responses to questions. It identifies whether AI models can avoid generating false or misleading information, particularly in areas where human knowledge is prone to misconceptions.
+
+**[Winogrande][wng]:** based on the [Winograd Schema Challenge][wng-chl], is a natural language understanding task requiring models to resolve ambiguities in sentences involving pronoun references.
+
+## Credits
+[LLaMa C++][llm] has a large and vibrant community of [contributors][llm-ctt] (~1,600 last time I checked) that actively maintain and extend its functionality, adding new models and architectures almost as fast as they appear. Considering the breakneck speed at which the AI/ML field is advancing, this alone is a remarkable feat!
+
+While I'm grateful to all contributors, I want to recognise three in particular:
+* [Colin Kealty][btk] (Bartowski), for the many contributions and for being one of the best sources of high quality quantized models available on Hugging Face
+* [Georgi Gerganov][ggg] for his amazing work with **llama.cpp** and the **ggml/gguf** libraries
+* [Iwan Kawrakow][ikk] for being one of the key authors behind the many quantization algorithms and the imatrix functionality.
+
+[arc]:      https://llm-stats.com/benchmarks/ai2-reasoning-challenge-(arc)
+[base]:     https://huggingface.co/ibm-granite/granite-4.1-8b
+[b-q4km]:   https://huggingface.co/bartowski
+[bch]:      https://github.com/ggml-org/llama.cpp/tree/master/tools/llama-bench
+[bf16]:     https://en.wikipedia.org/wiki/Bfloat16_floating-point_format
+[bpw]:      https://github.com/ggml-org/llama.cpp/discussions/18531
+[btk]:      https://huggingface.co/bartowski
+[ggf]:      https://huggingface.co/docs/hub/en/gguf
+[ggg]:      https://github.com/ggerganov
+[gh]:       https://github.com/EAddario/llama.cpp/tree/master
+[gpqa]:     https://arxiv.org/abs/2311.12022
+[gpqa-dat]: https://huggingface.co/datasets/eaddario/benchmark
+[hsw-tst]:  https://github.com/klosax/hellaswag_text_data
+[hsw]:      https://rowanzellers.com/hellaswag
+[ical]:     https://huggingface.co/datasets/eaddario/imatrix-calibration
+[ikk]:      https://github.com/ikawrakow
+[imtx-pr]:  https://github.com/ggml-org/llama.cpp/pull/14891
+[imx-dat]:  https://huggingface.co/eaddario/granite-4.1-8b-GGUF/tree/main/imatrix
+[imx]:      https://github.com/EAddario/llama.cpp/tree/imatrix
+[kld]:      https://en.wikipedia.org/wiki/Kullback–Leibler_divergence
+[lgt]:      https://huggingface.co/eaddario/granite-4.1-8b-GGUF/tree/main/logits
+[llm-ctt]:  https://github.com/ggml-org/llama.cpp/graphs/contributors
+[llm-rel]:  https://github.com/ggml-org/llama.cpp/releases/tag/b9358
+[llm]:      https://github.com/ggerganov/llama.cpp
+[mdl]:      https://huggingface.co/ibm-granite/granite-4.1-8b
+[mmlu]:     https://en.wikipedia.org/wiki/MMLU
+[mrdx]:     https://huggingface.co/datasets/Green-Sky/mmlu-redux-2.0-for-llama.cpp
+[ppl]:      https://github.com/ggml-org/llama.cpp/tree/master/tools/perplexity
+[ppx]:      https://huggingface.co/docs/transformers/en/perplexity
+[qtz-pr]:   https://github.com/ggml-org/llama.cpp/pull/15550
+[qtz]:      https://github.com/EAddario/llama.cpp/tree/quantize
+[sfts]:     https://huggingface.co/docs/safetensors/en/index
+[tqa]:      https://github.com/sylinrl/TruthfulQA
+[tst-dat]:  https://huggingface.co/datasets/ikawrakow/validation-datasets-for-llama.cpp/tree/main
+[u-q4km]:   https://huggingface.co/unsloth
+[ust-ai]:   https://unsloth.ai
+[ust]:      https://huggingface.co/unsloth
+[wki-dat]:  https://huggingface.co/datasets/Salesforce/wikitext/tree/main/wikitext-2-raw-v1
+[wng-chl]:  https://cdn.aaai.org/ocs/4492/4492-21843-1-PB.pdf
+[wng-tst]:  https://huggingface.co/datasets/ikawrakow/winogrande-eval-for-llama.cpp/tree/main
+[wng]:      https://winogrande.allenai.org
--- a/granite-4.1-8b-F16.gguf
+++ b/granite-4.1-8b-F16.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:041a4adb5827786916837f193e624ac4fced3e7c0eb9458708f8e39a50c80640
+size 17587417856
--- a/granite-4.1-8b-Q1_L.gguf
+++ b/granite-4.1-8b-Q1_L.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4dc3864de95c7f4d5568718625e58cf54d4046545d2bf397eb80970f0bfc7487
+size 1926722560
--- a/granite-4.1-8b-Q2_K.gguf
+++ b/granite-4.1-8b-Q2_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c149301db1c2da459842becd06edee4d695bdaa98ab19b2e72a8e77dca283a6f
+size 2750919680
--- a/granite-4.1-8b-Q3_K.gguf
+++ b/granite-4.1-8b-Q3_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:60b1874b8af548c0e7e265e025a1c0847afce50529defa47e090b2930cc0f2c1
+size 3849876480
--- a/granite-4.1-8b-Q4_K.gguf
+++ b/granite-4.1-8b-Q4_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2253b2e0b33a5ae20ea3acfe4e2a0cc44e1ead7ca440997db710afc1f2e63005
+size 4948784128
--- a/granite-4.1-8b-Q5_K.gguf
+++ b/granite-4.1-8b-Q5_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00f2df50b6bdb0b2e6c510f71cb502192b5271e55880f8a2a44a9d6736c5813d
+size 6047708160
--- a/granite-4.1-8b-Q6_K.gguf
+++ b/granite-4.1-8b-Q6_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:292a55c8ffd7ae6daf0db87a4399c70ed557158766a17f21ae528ab6bf10a222
+size 7146566656
--- a/granite-4.1-8b-Q7_K.gguf
+++ b/granite-4.1-8b-Q7_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a6e17af4482a0358522d65c8f0776605bdc565beaeefe998cb3975ef06a722d
+size 8245441536
--- a/granite-4.1-8b-Q8_0.gguf
+++ b/granite-4.1-8b-Q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7dcd5c8a7650336bdce6628d5e7645d33f73c0a3da6a679251d9b48d624a66d2
+size 9343267840
--- a/imatrix/imatrix-granite-4.1-8b-medium.gguf
+++ b/imatrix/imatrix-granite-4.1-8b-medium.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:884c70cf05568063f8e14655e063ead2ad52546f1421caab3a4ad0b4cc648601
+size 12054912
--- a/logits/granite-4.1-8b.logits
+++ b/logits/granite-4.1-8b.logits
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:57a822d9464e7d5cf600bf914065cb083783e20355f566609d0e2e0059b13e4f
+size 28905288788
--- a/scores/granite-4.1-8b-Q1_L.md
+++ b/scores/granite-4.1-8b-Q1_L.md
--- a/scores/granite-4.1-8b-Q2_K.md
+++ b/scores/granite-4.1-8b-Q2_K.md
--- a/scores/granite-4.1-8b-Q3_K.md
+++ b/scores/granite-4.1-8b-Q3_K.md
--- a/scores/granite-4.1-8b-Q4_K.md
+++ b/scores/granite-4.1-8b-Q4_K.md
--- a/scores/granite-4.1-8b-Q5_K.md
+++ b/scores/granite-4.1-8b-Q5_K.md
--- a/scores/granite-4.1-8b-Q6_K.md
+++ b/scores/granite-4.1-8b-Q6_K.md
--- a/scores/granite-4.1-8b-Q7_K.md
+++ b/scores/granite-4.1-8b-Q7_K.md
--- a/scores/granite-4.1-8b-Q8_0.md
+++ b/scores/granite-4.1-8b-Q8_0.md
--- a/scores/granite-4.1-8b-q1_l.arc
+++ b/scores/granite-4.1-8b-q1_l.arc
@@ -0,0 +1,18 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q1_L.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    2 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:   22 tensors
+llama_model_loader: - type iq1_s:  209 tensors
+llama_model_loader: - type iq2_s:   17 tensors
+llama_model_loader: - type iq1_m:   31 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ1_M - 1.75 bpw
+print_info: file size   = 1.79 GiB (1.75 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 36.5333 +/- 1.7594
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q1_l.gpqa
+++ b/scores/granite-4.1-8b-q1_l.gpqa
@@ -0,0 +1,18 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q1_L.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    2 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:   22 tensors
+llama_model_loader: - type iq1_s:  209 tensors
+llama_model_loader: - type iq2_s:   17 tensors
+llama_model_loader: - type iq1_m:   31 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ1_M - 1.75 bpw
+print_info: file size   = 1.79 GiB (1.75 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 19.1919 +/- 2.8058
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q1_l.hsw
+++ b/scores/granite-4.1-8b-q1_l.hsw
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q1_L.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    2 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:   22 tensors
+llama_model_loader: - type iq1_s:  209 tensors
+llama_model_loader: - type iq2_s:   17 tensors
+llama_model_loader: - type iq1_m:   31 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ1_M - 1.75 bpw
+print_info: file size   = 1.79 GiB (1.75 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	36.00000000%	[32.6441%, 39.4986%]
--- a/scores/granite-4.1-8b-q1_l.mmlu
+++ b/scores/granite-4.1-8b-q1_l.mmlu
@@ -0,0 +1,18 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q1_L.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    2 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:   22 tensors
+llama_model_loader: - type iq1_s:  209 tensors
+llama_model_loader: - type iq2_s:   17 tensors
+llama_model_loader: - type iq1_m:   31 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ1_M - 1.75 bpw
+print_info: file size   = 1.79 GiB (1.75 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 27.2000 +/- 1.6260
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q1_l.ppx
+++ b/scores/granite-4.1-8b-q1_l.ppx
@@ -0,0 +1,52 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q1_L.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    2 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:   22 tensors
+llama_model_loader: - type iq1_s:  209 tensors
+llama_model_loader: - type iq2_s:   17 tensors
+llama_model_loader: - type iq1_m:   31 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ1_M - 1.75 bpw
+print_info: file size   = 1.79 GiB (1.75 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :  87.318832 ±   0.781580
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  57.61%
+Mean ln(PPL(Q)/PPL(base))     :   2.307258 ±   0.007692
+Mean PPL(Q)/PPL(base)         :  10.046835 ±   0.077278
+Mean PPL(Q)-PPL(base)         :  78.627654 ±   0.745801
+
+====== KL divergence statistics ======
+Mean    KLD:   2.889523 ±   0.005948
+Maximum KLD:  18.836405
+99.9%   KLD:  13.080500
+99.0%   KLD:  10.150911
+95.0%   KLD:   7.400433
+90.0%   KLD:   6.028920
+Median  KLD:   2.342337
+10.0%   KLD:   0.519454
+ 5.0%   KLD:   0.230382
+ 1.0%   KLD:   0.035005
+ 0.1%   KLD:   0.005322
+Minimum KLD:   0.000491
+
+====== Token probability statistics ======
+Mean    Δp: -31.301 ± 0.094 %
+Maximum Δp: 92.012%
+99.9%   Δp: 58.470%
+99.0%   Δp: 27.386%
+95.0%   Δp:  4.750%
+90.0%   Δp:  0.243%
+75.0%   Δp: -0.866%
+Median  Δp: -17.956%
+25.0%   Δp: -60.731%
+10.0%   Δp: -90.577%
+ 5.0%   Δp: -97.636%
+ 1.0%   Δp: -99.874%
+ 0.1%   Δp: -99.991%
+Minimum Δp: -100.000%
+RMS Δp    : 47.467 ± 0.088 %
+Same top p: 34.309 ± 0.125 %
--- a/scores/granite-4.1-8b-q1_l.tqa
+++ b/scores/granite-4.1-8b-q1_l.tqa
@@ -0,0 +1,18 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q1_L.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    2 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:   22 tensors
+llama_model_loader: - type iq1_s:  209 tensors
+llama_model_loader: - type iq2_s:   17 tensors
+llama_model_loader: - type iq1_m:   31 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ1_M - 1.75 bpw
+print_info: file size   = 1.79 GiB (1.75 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 28.9333 +/- 1.6569
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q1_l.wng
+++ b/scores/granite-4.1-8b-q1_l.wng
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q1_L.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    2 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:   22 tensors
+llama_model_loader: - type iq1_s:  209 tensors
+llama_model_loader: - type iq2_s:   17 tensors
+llama_model_loader: - type iq1_m:   31 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ1_M - 1.75 bpw
+print_info: file size   = 1.79 GiB (1.75 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 52.5333 +/- 1.8246
--- a/scores/granite-4.1-8b-q2_k.arc
+++ b/scores/granite-4.1-8b-q2_k.arc
@@ -0,0 +1,21 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q2_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:   35 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type iq2_xxs:   41 tensors
+llama_model_loader: - type iq2_xs:   56 tensors
+llama_model_loader: - type iq3_xxs:    6 tensors
+llama_model_loader: - type iq1_s:    2 tensors
+llama_model_loader: - type iq3_s:   38 tensors
+llama_model_loader: - type iq2_s:   99 tensors
+llama_model_loader: - type iq1_m:    4 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ2_S - 2.5 bpw
+print_info: file size   = 2.56 GiB (2.50 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 60.4000 +/- 1.7870
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q2_k.gpqa
+++ b/scores/granite-4.1-8b-q2_k.gpqa
@@ -0,0 +1,21 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q2_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:   35 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type iq2_xxs:   41 tensors
+llama_model_loader: - type iq2_xs:   56 tensors
+llama_model_loader: - type iq3_xxs:    6 tensors
+llama_model_loader: - type iq1_s:    2 tensors
+llama_model_loader: - type iq3_s:   38 tensors
+llama_model_loader: - type iq2_s:   99 tensors
+llama_model_loader: - type iq1_m:    4 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ2_S - 2.5 bpw
+print_info: file size   = 2.56 GiB (2.50 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 29.7980 +/- 3.2586
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q2_k.hsw
+++ b/scores/granite-4.1-8b-q2_k.hsw
@@ -0,0 +1,20 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q2_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:   35 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type iq2_xxs:   41 tensors
+llama_model_loader: - type iq2_xs:   56 tensors
+llama_model_loader: - type iq3_xxs:    6 tensors
+llama_model_loader: - type iq1_s:    2 tensors
+llama_model_loader: - type iq3_s:   38 tensors
+llama_model_loader: - type iq2_s:   99 tensors
+llama_model_loader: - type iq1_m:    4 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ2_S - 2.5 bpw
+print_info: file size   = 2.56 GiB (2.50 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	70.00000000%	[66.6252%, 73.1710%]
--- a/scores/granite-4.1-8b-q2_k.mmlu
+++ b/scores/granite-4.1-8b-q2_k.mmlu
@@ -0,0 +1,21 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q2_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:   35 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type iq2_xxs:   41 tensors
+llama_model_loader: - type iq2_xs:   56 tensors
+llama_model_loader: - type iq3_xxs:    6 tensors
+llama_model_loader: - type iq1_s:    2 tensors
+llama_model_loader: - type iq3_s:   38 tensors
+llama_model_loader: - type iq2_s:   99 tensors
+llama_model_loader: - type iq1_m:    4 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ2_S - 2.5 bpw
+print_info: file size   = 2.56 GiB (2.50 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 59.2000 +/- 1.7958
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q2_k.ppx
+++ b/scores/granite-4.1-8b-q2_k.ppx
@@ -0,0 +1,55 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q2_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:   35 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type iq2_xxs:   41 tensors
+llama_model_loader: - type iq2_xs:   56 tensors
+llama_model_loader: - type iq3_xxs:    6 tensors
+llama_model_loader: - type iq1_s:    2 tensors
+llama_model_loader: - type iq3_s:   38 tensors
+llama_model_loader: - type iq2_s:   99 tensors
+llama_model_loader: - type iq1_m:    4 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ2_S - 2.5 bpw
+print_info: file size   = 2.56 GiB (2.50 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :  12.534216 ±   0.095606
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  86.12%
+Mean ln(PPL(Q)/PPL(base))     :   0.366154 ±   0.003993
+Mean PPL(Q)/PPL(base)         :   1.442177 ±   0.005759
+Mean PPL(Q)-PPL(base)         :   3.843038 ±   0.051440
+
+====== KL divergence statistics ======
+Mean    KLD:   0.644965 ±   0.002755
+Maximum KLD:  18.493736
+99.9%   KLD:  10.059598
+99.0%   KLD:   5.407475
+95.0%   KLD:   2.364230
+90.0%   KLD:   1.477545
+Median  KLD:   0.339213
+10.0%   KLD:   0.010624
+ 5.0%   KLD:   0.002467
+ 1.0%   KLD:   0.000277
+ 0.1%   KLD:   0.000030
+Minimum KLD:  -0.000000
+
+====== Token probability statistics ======
+Mean    Δp: -7.810 ± 0.058 %
+Maximum Δp: 99.884%
+99.9%   Δp: 73.625%
+99.0%   Δp: 40.369%
+95.0%   Δp: 16.588%
+90.0%   Δp:  7.372%
+75.0%   Δp:  0.201%
+Median  Δp: -0.916%
+25.0%   Δp: -11.370%
+10.0%   Δp: -33.838%
+ 5.0%   Δp: -54.602%
+ 1.0%   Δp: -93.772%
+ 0.1%   Δp: -99.844%
+Minimum Δp: -99.999%
+RMS Δp    : 23.380 ± 0.085 %
+Same top p: 67.231 ± 0.124 %
--- a/scores/granite-4.1-8b-q2_k.tqa
+++ b/scores/granite-4.1-8b-q2_k.tqa
@@ -0,0 +1,21 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q2_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:   35 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type iq2_xxs:   41 tensors
+llama_model_loader: - type iq2_xs:   56 tensors
+llama_model_loader: - type iq3_xxs:    6 tensors
+llama_model_loader: - type iq1_s:    2 tensors
+llama_model_loader: - type iq3_s:   38 tensors
+llama_model_loader: - type iq2_s:   99 tensors
+llama_model_loader: - type iq1_m:    4 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ2_S - 2.5 bpw
+print_info: file size   = 2.56 GiB (2.50 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 33.4667 +/- 1.7242
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q2_k.wng
+++ b/scores/granite-4.1-8b-q2_k.wng
@@ -0,0 +1,19 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q2_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:   35 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type iq2_xxs:   41 tensors
+llama_model_loader: - type iq2_xs:   56 tensors
+llama_model_loader: - type iq3_xxs:    6 tensors
+llama_model_loader: - type iq1_s:    2 tensors
+llama_model_loader: - type iq3_s:   38 tensors
+llama_model_loader: - type iq2_s:   99 tensors
+llama_model_loader: - type iq1_m:    4 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ2_S - 2.5 bpw
+print_info: file size   = 2.56 GiB (2.50 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 65.2000 +/- 1.7405
--- a/scores/granite-4.1-8b-q3_k.arc
+++ b/scores/granite-4.1-8b-q3_k.arc
@@ -0,0 +1,20 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q3_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    1 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type q4_K:   33 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:    2 tensors
+llama_model_loader: - type iq3_xxs:   31 tensors
+llama_model_loader: - type iq3_s:  165 tensors
+llama_model_loader: - type iq4_xs:   48 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ4_XS - 4.25 bpw
+print_info: file size   = 3.58 GiB (3.50 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 62.0000 +/- 1.7736
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q3_k.gpqa
+++ b/scores/granite-4.1-8b-q3_k.gpqa
@@ -0,0 +1,20 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q3_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    1 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type q4_K:   33 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:    2 tensors
+llama_model_loader: - type iq3_xxs:   31 tensors
+llama_model_loader: - type iq3_s:  165 tensors
+llama_model_loader: - type iq4_xs:   48 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ4_XS - 4.25 bpw
+print_info: file size   = 3.58 GiB (3.50 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 21.7172 +/- 2.9377
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q3_k.hsw
+++ b/scores/granite-4.1-8b-q3_k.hsw
@@ -0,0 +1,19 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q3_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    1 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type q4_K:   33 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:    2 tensors
+llama_model_loader: - type iq3_xxs:   31 tensors
+llama_model_loader: - type iq3_s:  165 tensors
+llama_model_loader: - type iq4_xs:   48 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ4_XS - 4.25 bpw
+print_info: file size   = 3.58 GiB (3.50 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	79.33333333%	[76.2895%, 82.0782%]
--- a/scores/granite-4.1-8b-q3_k.mmlu
+++ b/scores/granite-4.1-8b-q3_k.mmlu
@@ -0,0 +1,20 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q3_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    1 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type q4_K:   33 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:    2 tensors
+llama_model_loader: - type iq3_xxs:   31 tensors
+llama_model_loader: - type iq3_s:  165 tensors
+llama_model_loader: - type iq4_xs:   48 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ4_XS - 4.25 bpw
+print_info: file size   = 3.58 GiB (3.50 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 69.2000 +/- 1.6869
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q3_k.ppx
+++ b/scores/granite-4.1-8b-q3_k.ppx
@@ -0,0 +1,54 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q3_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    1 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type q4_K:   33 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:    2 tensors
+llama_model_loader: - type iq3_xxs:   31 tensors
+llama_model_loader: - type iq3_s:  165 tensors
+llama_model_loader: - type iq4_xs:   48 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ4_XS - 4.25 bpw
+print_info: file size   = 3.58 GiB (3.50 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :   9.381594 ±   0.070128
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  96.18%
+Mean ln(PPL(Q)/PPL(base))     :   0.076441 ±   0.002075
+Mean PPL(Q)/PPL(base)         :   1.079439 ±   0.002240
+Mean PPL(Q)-PPL(base)         :   0.690416 ±   0.019310
+
+====== KL divergence statistics ======
+Mean    KLD:   0.173887 ±   0.001079
+Maximum KLD:  14.743266
+99.9%   KLD:   5.111659
+99.0%   KLD:   1.928733
+95.0%   KLD:   0.623000
+90.0%   KLD:   0.364871
+Median  KLD:   0.072451
+10.0%   KLD:   0.001391
+ 5.0%   KLD:   0.000306
+ 1.0%   KLD:   0.000027
+ 0.1%   KLD:   0.000001
+Minimum KLD:  -0.000004
+
+====== Token probability statistics ======
+Mean    Δp: -2.503 ± 0.031 %
+Maximum Δp: 96.204%
+99.9%   Δp: 57.084%
+99.0%   Δp: 26.183%
+95.0%   Δp: 10.344%
+90.0%   Δp:  5.013%
+75.0%   Δp:  0.347%
+Median  Δp: -0.138%
+25.0%   Δp: -3.676%
+10.0%   Δp: -12.687%
+ 5.0%   Δp: -21.160%
+ 1.0%   Δp: -51.918%
+ 0.1%   Δp: -92.971%
+Minimum Δp: -99.997%
+RMS Δp    : 12.185 ± 0.069 %
+Same top p: 82.732 ± 0.100 %
--- a/scores/granite-4.1-8b-q3_k.tqa
+++ b/scores/granite-4.1-8b-q3_k.tqa
@@ -0,0 +1,20 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q3_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    1 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type q4_K:   33 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:    2 tensors
+llama_model_loader: - type iq3_xxs:   31 tensors
+llama_model_loader: - type iq3_s:  165 tensors
+llama_model_loader: - type iq4_xs:   48 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ4_XS - 4.25 bpw
+print_info: file size   = 3.58 GiB (3.50 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 39.6000 +/- 1.7870
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q3_k.wng
+++ b/scores/granite-4.1-8b-q3_k.wng
@@ -0,0 +1,18 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q3_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q2_K:    1 tensors
+llama_model_loader: - type q3_K:    1 tensors
+llama_model_loader: - type q4_K:   33 tensors
+llama_model_loader: - type iq2_xxs:    1 tensors
+llama_model_loader: - type iq2_xs:    2 tensors
+llama_model_loader: - type iq3_xxs:   31 tensors
+llama_model_loader: - type iq3_s:  165 tensors
+llama_model_loader: - type iq4_xs:   48 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = IQ4_XS - 4.25 bpw
+print_info: file size   = 3.58 GiB (3.50 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 71.7333 +/- 1.6453
--- a/scores/granite-4.1-8b-q4_k.arc
+++ b/scores/granite-4.1-8b-q4_k.arc
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q4_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q4_K:   90 tensors
+llama_model_loader: - type q5_K:   79 tensors
+llama_model_loader: - type iq3_xxs:    2 tensors
+llama_model_loader: - type iq3_s:    1 tensors
+llama_model_loader: - type iq4_xs:  110 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q4_K - Medium
+print_info: file size   = 4.61 GiB (4.50 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 66.9333 +/- 1.7190
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q4_k.gpqa
+++ b/scores/granite-4.1-8b-q4_k.gpqa
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q4_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q4_K:   90 tensors
+llama_model_loader: - type q5_K:   79 tensors
+llama_model_loader: - type iq3_xxs:    2 tensors
+llama_model_loader: - type iq3_s:    1 tensors
+llama_model_loader: - type iq4_xs:  110 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q4_K - Medium
+print_info: file size   = 4.61 GiB (4.50 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 23.2323 +/- 3.0089
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q4_k.hsw
+++ b/scores/granite-4.1-8b-q4_k.hsw
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q4_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q4_K:   90 tensors
+llama_model_loader: - type q5_K:   79 tensors
+llama_model_loader: - type iq3_xxs:    2 tensors
+llama_model_loader: - type iq3_s:    1 tensors
+llama_model_loader: - type iq4_xs:  110 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q4_K - Medium
+print_info: file size   = 4.61 GiB (4.50 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	79.73333333%	[76.7082%, 82.4554%]
--- a/scores/granite-4.1-8b-q4_k.mmlu
+++ b/scores/granite-4.1-8b-q4_k.mmlu
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q4_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q4_K:   90 tensors
+llama_model_loader: - type q5_K:   79 tensors
+llama_model_loader: - type iq3_xxs:    2 tensors
+llama_model_loader: - type iq3_s:    1 tensors
+llama_model_loader: - type iq4_xs:  110 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q4_K - Medium
+print_info: file size   = 4.61 GiB (4.50 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 71.4667 +/- 1.6500
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q4_k.ppx
+++ b/scores/granite-4.1-8b-q4_k.ppx
@@ -0,0 +1,51 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q4_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q4_K:   90 tensors
+llama_model_loader: - type q5_K:   79 tensors
+llama_model_loader: - type iq3_xxs:    2 tensors
+llama_model_loader: - type iq3_s:    1 tensors
+llama_model_loader: - type iq4_xs:  110 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q4_K - Medium
+print_info: file size   = 4.61 GiB (4.50 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :   8.867438 ±   0.067303
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  98.88%
+Mean ln(PPL(Q)/PPL(base))     :   0.020077 ±   0.001134
+Mean PPL(Q)/PPL(base)         :   1.020280 ±   0.001157
+Mean PPL(Q)-PPL(base)         :   0.176260 ±   0.010114
+
+====== KL divergence statistics ======
+Mean    KLD:   0.047917 ±   0.000392
+Maximum KLD:   8.513770
+99.9%   KLD:   1.939411
+99.0%   KLD:   0.563371
+95.0%   KLD:   0.167563
+90.0%   KLD:   0.095562
+Median  KLD:   0.017061
+10.0%   KLD:   0.000210
+ 5.0%   KLD:   0.000043
+ 1.0%   KLD:   0.000003
+ 0.1%   KLD:  -0.000001
+Minimum KLD:  -0.000004
+
+====== Token probability statistics ======
+Mean    Δp: -0.365 ± 0.017 %
+Maximum Δp: 95.922%
+99.9%   Δp: 43.653%
+99.0%   Δp: 16.925%
+95.0%   Δp:  6.946%
+90.0%   Δp:  3.742%
+75.0%   Δp:  0.557%
+Median  Δp: -0.002%
+25.0%   Δp: -0.901%
+10.0%   Δp: -4.570%
+ 5.0%   Δp: -8.319%
+ 1.0%   Δp: -22.260%
+ 0.1%   Δp: -58.978%
+Minimum Δp: -98.363%
+RMS Δp    :  6.446 ± 0.053 %
+Same top p: 90.937 ± 0.076 %
--- a/scores/granite-4.1-8b-q4_k.tqa
+++ b/scores/granite-4.1-8b-q4_k.tqa
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q4_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q4_K:   90 tensors
+llama_model_loader: - type q5_K:   79 tensors
+llama_model_loader: - type iq3_xxs:    2 tensors
+llama_model_loader: - type iq3_s:    1 tensors
+llama_model_loader: - type iq4_xs:  110 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q4_K - Medium
+print_info: file size   = 4.61 GiB (4.50 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 38.9333 +/- 1.7816
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q4_k.wng
+++ b/scores/granite-4.1-8b-q4_k.wng
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q4_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q4_K:   90 tensors
+llama_model_loader: - type q5_K:   79 tensors
+llama_model_loader: - type iq3_xxs:    2 tensors
+llama_model_loader: - type iq3_s:    1 tensors
+llama_model_loader: - type iq4_xs:  110 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q4_K - Medium
+print_info: file size   = 4.61 GiB (4.50 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 73.4667 +/- 1.6132
--- a/scores/granite-4.1-8b-q5_k.arc
+++ b/scores/granite-4.1-8b-q5_k.arc
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q5_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    1 tensors
+llama_model_loader: - type q4_K:   26 tensors
+llama_model_loader: - type q5_K:  246 tensors
+llama_model_loader: - type q6_K:    4 tensors
+llama_model_loader: - type iq4_xs:    5 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q5_K - Medium
+print_info: file size   = 5.63 GiB (5.50 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 66.4000 +/- 1.7259
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q5_k.gpqa
+++ b/scores/granite-4.1-8b-q5_k.gpqa
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q5_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    1 tensors
+llama_model_loader: - type q4_K:   26 tensors
+llama_model_loader: - type q5_K:  246 tensors
+llama_model_loader: - type q6_K:    4 tensors
+llama_model_loader: - type iq4_xs:    5 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q5_K - Medium
+print_info: file size   = 5.63 GiB (5.50 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 22.7273 +/- 2.9858
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q5_k.hsw
+++ b/scores/granite-4.1-8b-q5_k.hsw
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q5_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    1 tensors
+llama_model_loader: - type q4_K:   26 tensors
+llama_model_loader: - type q5_K:  246 tensors
+llama_model_loader: - type q6_K:    4 tensors
+llama_model_loader: - type iq4_xs:    5 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q5_K - Medium
+print_info: file size   = 5.63 GiB (5.50 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	79.86666667%	[76.8479%, 82.5810%]
--- a/scores/granite-4.1-8b-q5_k.mmlu
+++ b/scores/granite-4.1-8b-q5_k.mmlu
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q5_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    1 tensors
+llama_model_loader: - type q4_K:   26 tensors
+llama_model_loader: - type q5_K:  246 tensors
+llama_model_loader: - type q6_K:    4 tensors
+llama_model_loader: - type iq4_xs:    5 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q5_K - Medium
+print_info: file size   = 5.63 GiB (5.50 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 72.1333 +/- 1.6382
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q5_k.ppx
+++ b/scores/granite-4.1-8b-q5_k.ppx
@@ -0,0 +1,51 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q5_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    1 tensors
+llama_model_loader: - type q4_K:   26 tensors
+llama_model_loader: - type q5_K:  246 tensors
+llama_model_loader: - type q6_K:    4 tensors
+llama_model_loader: - type iq4_xs:    5 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q5_K - Medium
+print_info: file size   = 5.63 GiB (5.50 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :   8.766150 ±   0.066421
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  99.48%
+Mean ln(PPL(Q)/PPL(base))     :   0.008589 ±   0.000770
+Mean PPL(Q)/PPL(base)         :   1.008626 ±   0.000776
+Mean PPL(Q)-PPL(base)         :   0.074972 ±   0.006775
+
+====== KL divergence statistics ======
+Mean    KLD:   0.018940 ±   0.000165
+Maximum KLD:   5.148437
+99.9%   KLD:   0.762867
+99.0%   KLD:   0.213410
+95.0%   KLD:   0.065414
+90.0%   KLD:   0.037975
+Median  KLD:   0.006922
+10.0%   KLD:   0.000082
+ 5.0%   KLD:   0.000017
+ 1.0%   KLD:   0.000001
+ 0.1%   KLD:  -0.000003
+Minimum KLD:  -0.000006
+
+====== Token probability statistics ======
+Mean    Δp: -0.182 ± 0.011 %
+Maximum Δp: 91.879%
+99.9%   Δp: 30.364%
+99.0%   Δp: 10.955%
+95.0%   Δp:  4.408%
+90.0%   Δp:  2.363%
+75.0%   Δp:  0.367%
+Median  Δp: -0.001%
+25.0%   Δp: -0.575%
+10.0%   Δp: -2.918%
+ 5.0%   Δp: -5.194%
+ 1.0%   Δp: -12.983%
+ 0.1%   Δp: -33.902%
+Minimum Δp: -90.554%
+RMS Δp    :  4.061 ± 0.040 %
+Same top p: 94.120 ± 0.062 %
--- a/scores/granite-4.1-8b-q5_k.tqa
+++ b/scores/granite-4.1-8b-q5_k.tqa
@@ -0,0 +1,17 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q5_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    1 tensors
+llama_model_loader: - type q4_K:   26 tensors
+llama_model_loader: - type q5_K:  246 tensors
+llama_model_loader: - type q6_K:    4 tensors
+llama_model_loader: - type iq4_xs:    5 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q5_K - Medium
+print_info: file size   = 5.63 GiB (5.50 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 38.5333 +/- 1.7783
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q5_k.wng
+++ b/scores/granite-4.1-8b-q5_k.wng
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q5_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    1 tensors
+llama_model_loader: - type q4_K:   26 tensors
+llama_model_loader: - type q5_K:  246 tensors
+llama_model_loader: - type q6_K:    4 tensors
+llama_model_loader: - type iq4_xs:    5 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q5_K - Medium
+print_info: file size   = 5.63 GiB (5.50 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 73.4667 +/- 1.6132
--- a/scores/granite-4.1-8b-q6_k.arc
+++ b/scores/granite-4.1-8b-q6_k.arc
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q6_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q8_0:   35 tensors
+llama_model_loader: - type q4_K:    2 tensors
+llama_model_loader: - type q5_K:   75 tensors
+llama_model_loader: - type q6_K:  170 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q6_K
+print_info: file size   = 6.65 GiB (6.50 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 67.0667 +/- 1.7172
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q6_k.gpqa
+++ b/scores/granite-4.1-8b-q6_k.gpqa
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q6_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q8_0:   35 tensors
+llama_model_loader: - type q4_K:    2 tensors
+llama_model_loader: - type q5_K:   75 tensors
+llama_model_loader: - type q6_K:  170 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q6_K
+print_info: file size   = 6.65 GiB (6.50 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 24.7475 +/- 3.0746
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q6_k.hsw
+++ b/scores/granite-4.1-8b-q6_k.hsw
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q6_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q8_0:   35 tensors
+llama_model_loader: - type q4_K:    2 tensors
+llama_model_loader: - type q5_K:   75 tensors
+llama_model_loader: - type q6_K:  170 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q6_K
+print_info: file size   = 6.65 GiB (6.50 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	80.13333333%	[77.1274%, 82.8322%]
--- a/scores/granite-4.1-8b-q6_k.mmlu
+++ b/scores/granite-4.1-8b-q6_k.mmlu
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q6_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q8_0:   35 tensors
+llama_model_loader: - type q4_K:    2 tensors
+llama_model_loader: - type q5_K:   75 tensors
+llama_model_loader: - type q6_K:  170 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q6_K
+print_info: file size   = 6.65 GiB (6.50 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 72.6667 +/- 1.6284
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q6_k.ppx
+++ b/scores/granite-4.1-8b-q6_k.ppx
@@ -0,0 +1,50 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q6_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q8_0:   35 tensors
+llama_model_loader: - type q4_K:    2 tensors
+llama_model_loader: - type q5_K:   75 tensors
+llama_model_loader: - type q6_K:  170 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q6_K
+print_info: file size   = 6.65 GiB (6.50 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :   8.755199 ±   0.066400
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  99.74%
+Mean ln(PPL(Q)/PPL(base))     :   0.007339 ±   0.000550
+Mean PPL(Q)/PPL(base)         :   1.007366 ±   0.000554
+Mean PPL(Q)-PPL(base)         :   0.064021 ±   0.004871
+
+====== KL divergence statistics ======
+Mean    KLD:   0.007326 ±   0.000066
+Maximum KLD:   2.273445
+99.9%   KLD:   0.273010
+99.0%   KLD:   0.081142
+95.0%   KLD:   0.025136
+90.0%   KLD:   0.014795
+Median  KLD:   0.002831
+10.0%   KLD:   0.000033
+ 5.0%   KLD:   0.000007
+ 1.0%   KLD:   0.000000
+ 0.1%   KLD:  -0.000003
+Minimum KLD:  -0.000027
+
+====== Token probability statistics ======
+Mean    Δp: -0.107 ± 0.007 %
+Maximum Δp: 79.111%
+99.9%   Δp: 18.154%
+99.0%   Δp:  7.012%
+95.0%   Δp:  2.856%
+90.0%   Δp:  1.538%
+75.0%   Δp:  0.232%
+Median  Δp: -0.001%
+25.0%   Δp: -0.371%
+10.0%   Δp: -1.892%
+ 5.0%   Δp: -3.299%
+ 1.0%   Δp: -7.834%
+ 0.1%   Δp: -21.254%
+Minimum Δp: -87.374%
+RMS Δp    :  2.562 ± 0.030 %
+Same top p: 96.165 ± 0.051 %
--- a/scores/granite-4.1-8b-q6_k.tqa
+++ b/scores/granite-4.1-8b-q6_k.tqa
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q6_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q8_0:   35 tensors
+llama_model_loader: - type q4_K:    2 tensors
+llama_model_loader: - type q5_K:   75 tensors
+llama_model_loader: - type q6_K:  170 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q6_K
+print_info: file size   = 6.65 GiB (6.50 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 38.2667 +/- 1.7759
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q6_k.wng
+++ b/scores/granite-4.1-8b-q6_k.wng
@@ -0,0 +1,14 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q6_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q8_0:   35 tensors
+llama_model_loader: - type q4_K:    2 tensors
+llama_model_loader: - type q5_K:   75 tensors
+llama_model_loader: - type q6_K:  170 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q6_K
+print_info: file size   = 6.65 GiB (6.50 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 73.7333 +/- 1.6080
--- a/scores/granite-4.1-8b-q7_k.arc
+++ b/scores/granite-4.1-8b-q7_k.arc
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q7_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    4 tensors
+llama_model_loader: - type q8_0:  146 tensors
+llama_model_loader: - type q6_K:  132 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 7.68 GiB (7.50 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 66.4000 +/- 1.7259
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q7_k.gpqa
+++ b/scores/granite-4.1-8b-q7_k.gpqa
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q7_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    4 tensors
+llama_model_loader: - type q8_0:  146 tensors
+llama_model_loader: - type q6_K:  132 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 7.68 GiB (7.50 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 26.7677 +/- 3.1544
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q7_k.hsw
+++ b/scores/granite-4.1-8b-q7_k.hsw
@@ -0,0 +1,14 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q7_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    4 tensors
+llama_model_loader: - type q8_0:  146 tensors
+llama_model_loader: - type q6_K:  132 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 7.68 GiB (7.50 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	80.26666667%	[77.2672%, 82.9576%]
--- a/scores/granite-4.1-8b-q7_k.mmlu
+++ b/scores/granite-4.1-8b-q7_k.mmlu
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q7_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    4 tensors
+llama_model_loader: - type q8_0:  146 tensors
+llama_model_loader: - type q6_K:  132 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 7.68 GiB (7.50 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 72.1333 +/- 1.6382
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q7_k.ppx
+++ b/scores/granite-4.1-8b-q7_k.ppx
@@ -0,0 +1,49 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q7_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    4 tensors
+llama_model_loader: - type q8_0:  146 tensors
+llama_model_loader: - type q6_K:  132 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 7.68 GiB (7.50 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :   8.751241 ±   0.066500
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  99.82%
+Mean ln(PPL(Q)/PPL(base))     :   0.006887 ±   0.000464
+Mean PPL(Q)/PPL(base)         :   1.006911 ±   0.000467
+Mean PPL(Q)-PPL(base)         :   0.060063 ±   0.004141
+
+====== KL divergence statistics ======
+Mean    KLD:   0.003568 ±   0.000040
+Maximum KLD:   2.888946
+99.9%   KLD:   0.140997
+99.0%   KLD:   0.037132
+95.0%   KLD:   0.011608
+90.0%   KLD:   0.006961
+Median  KLD:   0.001456
+10.0%   KLD:   0.000015
+ 5.0%   KLD:   0.000003
+ 1.0%   KLD:  -0.000000
+ 0.1%   KLD:  -0.000004
+Minimum KLD:  -0.000012
+
+====== Token probability statistics ======
+Mean    Δp: -0.007 ± 0.005 %
+Maximum Δp: 81.280%
+99.9%   Δp: 12.574%
+99.0%   Δp:  4.968%
+95.0%   Δp:  2.242%
+90.0%   Δp:  1.259%
+75.0%   Δp:  0.222%
+Median  Δp: -0.000%
+25.0%   Δp: -0.211%
+10.0%   Δp: -1.245%
+ 5.0%   Δp: -2.232%
+ 1.0%   Δp: -5.277%
+ 0.1%   Δp: -14.266%
+Minimum Δp: -57.371%
+RMS Δp    :  1.812 ± 0.025 %
+Same top p: 97.235 ± 0.043 %
--- a/scores/granite-4.1-8b-q7_k.tqa
+++ b/scores/granite-4.1-8b-q7_k.tqa
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q7_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    4 tensors
+llama_model_loader: - type q8_0:  146 tensors
+llama_model_loader: - type q6_K:  132 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 7.68 GiB (7.50 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 38.5333 +/- 1.7783
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q7_k.wng
+++ b/scores/granite-4.1-8b-q7_k.wng
@@ -0,0 +1,13 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q7_K.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    4 tensors
+llama_model_loader: - type q8_0:  146 tensors
+llama_model_loader: - type q6_K:  132 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 7.68 GiB (7.50 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 73.6000 +/- 1.6106
--- a/scores/granite-4.1-8b-q8_0.arc
+++ b/scores/granite-4.1-8b-q8_0.arc
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q8_0.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    2 tensors
+llama_model_loader: - type q8_0:  266 tensors
+llama_model_loader: - type q6_K:    2 tensors
+llama_model_loader: - type bf16:   12 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 8.70 GiB (8.50 BPW) 
+
+multiple_choice_score: there are 869 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 869 tasks available
+multiple_choice_score : calculating ARC Challenge score over 750 tasks.
+
+Final result: 66.8000 +/- 1.7207
+Random chance: 25.0083 +/- 1.5824
--- a/scores/granite-4.1-8b-q8_0.gpqa
+++ b/scores/granite-4.1-8b-q8_0.gpqa
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q8_0.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    2 tensors
+llama_model_loader: - type q8_0:  266 tensors
+llama_model_loader: - type q6_K:    2 tensors
+llama_model_loader: - type bf16:   12 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 8.70 GiB (8.50 BPW) 
+
+multiple_choice_score: there are 198 tasks in prompt
+multiple_choice_score: reading tasks......................................................................................................................................................................................................done
+multiple_choice_score : calculating GPQA-Diamond score over 198 tasks.
+
+Final result: 26.7677 +/- 3.1544
+Random chance: 24.5963 +/- 3.0683
--- a/scores/granite-4.1-8b-q8_0.hsw
+++ b/scores/granite-4.1-8b-q8_0.hsw
@@ -0,0 +1,15 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q8_0.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    2 tensors
+llama_model_loader: - type q8_0:  266 tensors
+llama_model_loader: - type q6_K:    2 tensors
+llama_model_loader: - type bf16:   12 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 8.70 GiB (8.50 BPW) 
+
+hellaswag_score : loaded 10042 tasks from prompt.
+hellaswag_score : selecting 750 randomized tasks.
+hellaswag_score : calculating hellaswag score over selected tasks.
+
+750	80.53333333%	[77.5470%, 83.2085%]
--- a/scores/granite-4.1-8b-q8_0.mmlu
+++ b/scores/granite-4.1-8b-q8_0.mmlu
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q8_0.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    2 tensors
+llama_model_loader: - type q8_0:  266 tensors
+llama_model_loader: - type q6_K:    2 tensors
+llama_model_loader: - type bf16:   12 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 8.70 GiB (8.50 BPW) 
+
+multiple_choice_score: there are 5362 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 5362 tasks available
+multiple_choice_score : calculating MMLU-Redux score over 750 tasks.
+
+Final result: 72.4000 +/- 1.6334
+Random chance: 25.0000 +/- 1.5822
--- a/scores/granite-4.1-8b-q8_0.ppx
+++ b/scores/granite-4.1-8b-q8_0.ppx
@@ -0,0 +1,50 @@
+Will perform strided perplexity calculation -> adjusting context size from 3072 to 3264
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q8_0.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    2 tensors
+llama_model_loader: - type q8_0:  266 tensors
+llama_model_loader: - type q6_K:    2 tensors
+llama_model_loader: - type bf16:   12 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 8.70 GiB (8.50 BPW) 
+
+====== Perplexity statistics ======
+Mean PPL(Q)                   :   8.749119 ±   0.066517
+Mean PPL(base)                :   8.691178 ±   0.065443
+Cor(ln(PPL(Q)), ln(PPL(base))):  99.85%
+Mean ln(PPL(Q)/PPL(base))     :   0.006644 ±   0.000418
+Mean PPL(Q)/PPL(base)         :   1.006667 ±   0.000421
+Mean PPL(Q)-PPL(base)         :   0.057941 ±   0.003751
+
+====== KL divergence statistics ======
+Mean    KLD:   0.002052 ±   0.000024
+Maximum KLD:   1.924665
+99.9%   KLD:   0.070725
+99.0%   KLD:   0.018533
+95.0%   KLD:   0.006534
+90.0%   KLD:   0.004148
+Median  KLD:   0.000965
+10.0%   KLD:   0.000008
+ 5.0%   KLD:   0.000002
+ 1.0%   KLD:  -0.000001
+ 0.1%   KLD:  -0.000004
+Minimum KLD:  -0.000013
+
+====== Token probability statistics ======
+Mean    Δp:  0.031 ± 0.004 %
+Maximum Δp: 67.287%
+99.9%   Δp:  9.257%
+99.0%   Δp:  4.075%
+95.0%   Δp:  1.929%
+90.0%   Δp:  1.101%
+75.0%   Δp:  0.201%
+Median  Δp:  0.000%
+25.0%   Δp: -0.151%
+10.0%   Δp: -0.973%
+ 5.0%   Δp: -1.750%
+ 1.0%   Δp: -3.980%
+ 0.1%   Δp: -9.904%
+Minimum Δp: -53.630%
+RMS Δp    :  1.396 ± 0.020 %
+Same top p: 97.749 ± 0.039 %
--- a/scores/granite-4.1-8b-q8_0.tqa
+++ b/scores/granite-4.1-8b-q8_0.tqa
@@ -0,0 +1,16 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q8_0.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    2 tensors
+llama_model_loader: - type q8_0:  266 tensors
+llama_model_loader: - type q6_K:    2 tensors
+llama_model_loader: - type bf16:   12 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 8.70 GiB (8.50 BPW) 
+
+multiple_choice_score: there are 817 tasks in prompt
+multiple_choice_score: selecting 750 random tasks from 817 tasks available
+multiple_choice_score : calculating TruthfulQA score over 750 tasks.
+
+Final result: 38.4000 +/- 1.7771
+Random chance: 19.8992 +/- 1.4588
--- a/scores/granite-4.1-8b-q8_0.wng
+++ b/scores/granite-4.1-8b-q8_0.wng
@@ -0,0 +1,14 @@
+llama_model_loader: loaded meta data with 39 key-value pairs and 363 tensors from granite-4.1-8b-Q8_0.gguf (version GGUF V3 (latest))
+llama_model_loader: - type  f32:   81 tensors
+llama_model_loader: - type q5_1:    2 tensors
+llama_model_loader: - type q8_0:  266 tensors
+llama_model_loader: - type q6_K:    2 tensors
+llama_model_loader: - type bf16:   12 tensors
+print_info: file format = GGUF V3 (latest)
+print_info: file type   = Q8_0
+print_info: file size   = 8.70 GiB (8.50 BPW) 
+
+winogrande_score : loaded 1266 tasks from prompt.
+winogrande_score : selecting 750 random tasks
+
+Final Winogrande score(750 tasks): 73.2000 +/- 1.6184
--- a/scores/granite-4.1-8b.itx
+++ b/scores/granite-4.1-8b.itx
@@ -0,0 +1,332 @@
+ggml_cuda_init: found 1 CUDA devices (Total VRAM: 124610 MiB):
+  Device 0: NVIDIA GB10, compute capability 12.1, VMM: yes, VRAM: 124610 MiB
+
+Computing statistics for imatrix/imatrix-granite-4.1-8b-medium.gguf (280 tensors)
+
+ Layer	       Tensor	          Σ(Act²)	  Min	            Max	           μ	   σ	 % Active	N	   Entropy	E (norm)	ZD	  CosSim
+=========================================================================================================================================================================
+   39	attn_k              	 174643.00	  2.0243	 18914.7031	 42.64	497.38	  100.00%	  4096	    8.8904	 74.09%	      0.37%	  0.8865
+   38	attn_k              	 166087.69	  0.0000	 20050.7402	 40.55	448.81	   99.98%	  4096	    8.6133	 71.78%	      0.46%	  0.9835
+   37	attn_k              	 146614.73	  0.7595	 20756.5176	 35.79	423.56	  100.00%	  4096	    8.3834	 69.86%	      0.44%	  0.9842
+   36	attn_k              	 134513.23	  0.5200	 19003.3398	 32.84	386.52	  100.00%	  4096	    8.2079	 68.40%	      0.51%	  0.9501
+   35	attn_k              	 124035.38	  1.3198	 11533.5068	 30.28	305.84	  100.00%	  4096	    8.2914	 69.09%	      0.71%	  0.9665
+   34	attn_k              	 123896.47	  0.5387	 17763.3496	 30.25	472.60	  100.00%	  4096	    6.6833	 55.69%	      0.44%	  0.9800
+   32	attn_k              	 111128.92	  0.1590	 25305.4961	 27.13	504.76	  100.00%	  4096	    6.2867	 52.39%	      0.37%	  0.9931
+   30	attn_k              	 109705.93	  0.0000	 33505.8359	 26.78	617.29	   99.98%	  4096	    5.4138	 45.11%	      0.27%	  0.9759
+   33	attn_k              	 109045.48	  0.9963	 20537.8262	 26.62	448.68	  100.00%	  4096	    6.6424	 55.35%	      0.37%	  0.9914
+   29	attn_k              	  87316.21	  0.0000	 20308.4004	 21.32	398.84	   99.95%	  4096	    6.1991	 51.66%	      0.37%	  0.9936
+   31	attn_k              	  87185.37	  0.0000	 22471.5254	 21.29	421.05	   99.98%	  4096	    6.2130	 51.78%	      0.34%	  0.9963
+   28	attn_k              	  82016.98	  0.0000	 23024.2656	 20.02	430.64	   99.95%	  4096	    5.6830	 47.36%	      0.29%	  0.9976
+   27	attn_k              	  76821.73	  0.0000	 17911.5156	 18.76	348.43	   99.98%	  4096	    6.3444	 52.87%	      0.34%	  0.9791
+   16	attn_k              	  76133.66	  0.0000	 11891.1016	 18.59	311.73	   99.93%	  4096	    6.1208	 51.01%	      0.42%	  0.9643
+   23	attn_k              	  74987.37	  0.0000	 18502.6172	 18.31	356.15	   99.95%	  4096	    6.1167	 50.97%	      0.39%	  0.9980
+   22	attn_k              	  71226.52	  0.0000	 18282.5273	 17.39	343.00	   99.98%	  4096	    6.2861	 52.38%	      0.32%	  0.9901
+   21	attn_k              	  69479.59	  0.0000	 14531.5439	 16.96	297.70	   99.95%	  4096	    6.6280	 55.23%	      0.39%	  0.9882
+   20	attn_k              	  68286.74	  0.0000	 18747.7070	 16.67	345.57	   99.95%	  4096	    6.0506	 50.42%	      0.34%	  0.9917
+   25	attn_k              	  68221.13	  0.0000	 14562.2783	 16.66	294.34	   99.98%	  4096	    6.3805	 53.17%	      0.39%	  0.9829
+    7	attn_k              	  68092.71	  0.0000	 17005.3926	 16.62	348.43	   99.90%	  4096	    5.9826	 49.85%	      0.32%	  0.9814
+   18	attn_k              	  66295.24	  0.0000	 12255.0391	 16.19	262.31	   99.95%	  4096	    6.9157	 57.63%	      0.42%	  0.9978
+   26	attn_k              	  65291.02	  0.0000	 12545.3467	 15.94	268.54	   99.98%	  4096	    6.6067	 55.06%	      0.39%	  0.9920
+   13	attn_k              	  59896.29	  0.0000	  8712.0469	 14.62	232.75	   99.90%	  4096	    6.9162	 57.63%	      0.32%	  0.9786
+   24	attn_k              	  56921.47	  0.0000	  9241.3613	 13.90	213.49	   99.98%	  4096	    7.0602	 58.84%	      0.54%	  0.9757
+   17	attn_k              	  56760.55	  0.0000	 10113.2490	 13.86	223.49	   99.95%	  4096	    6.7278	 56.06%	      0.44%	  0.9569
+   15	attn_k              	  55194.11	  0.0000	  9697.7783	 13.48	229.94	   99.93%	  4096	    5.9460	 49.55%	      0.37%	  0.9288
+   14	attn_k              	  54794.45	  0.0000	  8291.7021	 13.38	212.09	   99.90%	  4096	    7.0371	 58.64%	      0.37%	  0.9885
+    6	attn_k              	  53044.36	  0.0000	 16721.8047	 12.95	321.79	   99.88%	  4096	    4.5291	 37.74%	      0.32%	  0.9479
+   19	attn_k              	  52733.22	  0.0000	 11920.8223	 12.87	233.97	   99.95%	  4096	    6.5100	 54.25%	      0.39%	  0.9902
+    8	attn_k              	  51986.04	  0.0000	 10429.2197	 12.69	233.14	   99.90%	  4096	    6.5500	 54.58%	      0.29%	  0.9699
+    9	attn_k              	  49641.15	  0.0000	 10131.9502	 12.12	241.91	   99.90%	  4096	    5.8877	 49.06%	      0.34%	  0.9950
+   12	attn_k              	  48607.36	  0.0000	  7781.5098	 11.87	191.06	   99.93%	  4096	    7.0521	 58.77%	      0.37%	  0.9965
+    4	attn_k              	  46316.68	  0.0000	 16862.5684	 11.31	309.35	   99.85%	  4096	    5.2333	 43.61%	      0.22%	  0.7166
+    5	attn_k              	  45620.26	  0.0000	 16766.0762	 11.14	317.06	   99.88%	  4096	    4.5011	 37.51%	      0.22%	  0.9947
+   11	attn_k              	  45317.79	  0.0000	  6714.2949	 11.06	172.61	   99.93%	  4096	    7.2487	 60.41%	      0.37%	  0.9866
+   10	attn_k              	  43706.77	  0.0000	  6960.2920	 10.67	180.78	   99.93%	  4096	    6.7438	 56.20%	      0.34%	  0.9923
+    2	attn_k              	  19532.52	  0.0000	  6018.6182	  4.77	 99.81	   99.90%	  4096	    7.6636	 63.86%	      0.20%	  0.3212
+    3	attn_k              	  17324.65	  0.0000	  5779.3477	  4.23	110.43	   99.93%	  4096	    5.5684	 46.40%	      0.22%	  0.9580
+    1	attn_k              	  15856.24	  0.0000	  5183.1831	  3.87	 86.07	   98.66%	  4096	    6.6712	 55.59%	      0.22%	  0.3483
+    0	attn_k              	   3049.93	  0.0000	   247.0233	  0.74	  7.67	   97.14%	  4096	    6.8129	 56.77%	      1.12%	  0.0000
+   39	attn_output         	  34614.42	  1.0529	   359.3260	  8.45	 11.78	  100.00%	  4096	   11.3365	 94.47%	      7.59%	  0.3770
+   38	attn_output         	  13420.36	  0.2976	   103.0346	  3.28	  4.13	  100.00%	  4096	   11.3248	 94.37%	      8.98%	  0.2804
+   37	attn_output         	   8831.00	  0.2297	   108.9257	  2.16	  3.37	  100.00%	  4096	   11.2679	 93.90%	      5.49%	  0.2283
+   36	attn_output         	   8013.26	  0.1413	    95.6638	  1.96	  3.93	  100.00%	  4096	   11.0147	 91.79%	      4.32%	  0.2457
+   35	attn_output         	   3675.13	  0.1878	    48.8232	  0.90	  1.65	  100.00%	  4096	   11.2243	 93.54%	      4.52%	  0.2357
+   34	attn_output         	   3483.17	  0.0606	    33.0821	  0.85	  1.59	  100.00%	  4096	   11.1613	 93.01%	      3.96%	  0.1202
+   33	attn_output         	   3199.42	  0.0368	   114.1278	  0.78	  2.50	  100.00%	  4096	   10.6861	 89.05%	      3.47%	  0.1774
+   31	attn_output         	   2234.35	  0.0523	    41.9673	  0.55	  1.30	  100.00%	  4096	   10.8825	 90.69%	      5.00%	  0.2217
+    1	attn_output         	   1997.94	  0.0106	    18.5997	  0.49	  0.98	  100.00%	  4096	   10.5931	 88.28%	     10.03%	  0.0200
+    2	attn_output         	   1738.62	  0.0199	     8.3539	  0.42	  0.55	  100.00%	  4096	   11.1150	 92.63%	     16.77%	  0.3314
+   32	attn_output         	   1524.28	  0.0124	    13.4450	  0.37	  0.70	  100.00%	  4096	   11.1955	 93.30%	      3.03%	  0.1768
+   30	attn_output         	   1314.30	  0.0875	     9.0597	  0.32	  0.51	  100.00%	  4096	   11.3404	 94.50%	      3.64%	  0.2404
+   28	attn_output         	   1114.76	  0.0367	    12.3692	  0.27	  0.65	  100.00%	  4096	   10.8974	 90.81%	      3.59%	  0.1806
+    3	attn_output         	   1080.53	  0.0156	     5.2009	  0.26	  0.36	  100.00%	  4096	   11.1964	 93.30%	     10.28%	  0.2966
+   24	attn_output         	    914.61	  0.0400	     6.5156	  0.22	  0.32	  100.00%	  4096	   11.3443	 94.54%	      6.69%	  0.1864
+   23	attn_output         	    900.86	  0.0061	    16.3921	  0.22	  0.55	  100.00%	  4096	   10.9512	 91.26%	      3.27%	  0.1833
+   29	attn_output         	    868.15	  0.0168	     8.5233	  0.21	  0.45	  100.00%	  4096	   11.0238	 91.87%	      4.83%	  0.1848
+   27	attn_output         	    855.07	  0.0081	     8.6770	  0.21	  0.41	  100.00%	  4096	   11.1371	 92.81%	      3.39%	  0.2051
+   22	attn_output         	    812.40	  0.0144	     7.8408	  0.20	  0.37	  100.00%	  4096	   11.1740	 93.12%	      3.88%	  0.2016
+   17	attn_output         	    711.99	  0.0085	     4.7093	  0.17	  0.28	  100.00%	  4096	   11.1963	 93.30%	      4.81%	  0.2343
+   21	attn_output         	    709.29	  0.0000	    10.5542	  0.17	  0.37	  100.00%	  4096	   10.9892	 91.58%	      4.57%	  0.1817
+   19	attn_output         	    707.10	  0.0186	     6.2341	  0.17	  0.23	  100.00%	  4096	   11.4981	 95.82%	      3.22%	  0.2283
+   20	attn_output         	    703.72	  0.0083	     5.4485	  0.17	  0.28	  100.00%	  4096	   11.2945	 94.12%	      3.93%	  0.2992
+   25	attn_output         	    656.68	  0.0052	    10.7580	  0.16	  0.38	  100.00%	  4096	   11.0354	 91.96%	      2.08%	  0.2214
+   15	attn_output         	    646.34	  0.0052	     8.5272	  0.16	  0.29	  100.00%	  4096	   11.0779	 92.32%	      6.45%	  0.2046
+   16	attn_output         	    610.13	  0.0001	     6.2649	  0.15	  0.35	  100.00%	  4096	   10.7437	 89.53%	      3.83%	  0.1555
+   26	attn_output         	    609.93	  0.0232	     5.7634	  0.15	  0.28	  100.00%	  4096	   11.2354	 93.63%	      3.52%	  0.1915
+   13	attn_output         	    548.35	  0.0033	     4.0648	  0.13	  0.21	  100.00%	  4096	   10.8651	 90.54%	     12.60%	  0.4666
+   18	attn_output         	    516.94	  0.0000	    10.2987	  0.13	  0.28	   99.76%	  4096	   11.0928	 92.44%	      2.69%	  0.2541
+    4	attn_output         	    453.05	  0.0051	     3.9059	  0.11	  0.15	  100.00%	  4096	   11.3247	 94.37%	      8.91%	  0.3225
+    0	attn_output         	    447.61	  0.0008	    91.7077	  0.11	  1.72	  100.00%	  4096	    6.9468	 57.89%	      0.73%	  0.0000
+   10	attn_output         	    439.24	  0.0036	     3.4716	  0.11	  0.26	  100.00%	  4096	   10.4123	 86.77%	      7.06%	  0.2021
+   11	attn_output         	    401.22	  0.0051	     1.9410	  0.10	  0.15	  100.00%	  4096	   11.0397	 92.00%	     10.16%	  0.1149
+   14	attn_output         	    350.10	  0.0024	     3.9673	  0.09	  0.14	  100.00%	  4096	   11.0800	 92.33%	      6.81%	  0.2386
+    5	attn_output         	    296.64	  0.0028	     3.5316	  0.07	  0.11	  100.00%	  4096	   11.1694	 93.08%	      6.15%	  0.2990
+    7	attn_output         	    240.15	  0.0033	     3.3802	  0.06	  0.11	  100.00%	  4096	   11.1050	 92.54%	      5.96%	  0.3540
+    6	attn_output         	    218.34	  0.0015	     1.1016	  0.05	  0.07	  100.00%	  4096	   11.2492	 93.74%	     10.18%	  0.2733
+    8	attn_output         	    208.74	  0.0015	     5.2777	  0.05	  0.12	  100.00%	  4096	   10.9654	 91.38%	      5.47%	  0.1650
+   12	attn_output         	    208.53	  0.0032	     2.3583	  0.05	  0.07	  100.00%	  4096	   11.4232	 95.19%	      9.01%	  0.3528
+    9	attn_output         	    151.65	  0.0025	     1.4596	  0.04	  0.05	  100.00%	  4096	   11.3319	 94.43%	      6.32%	  0.2434
+   39	attn_q              	 174643.00	  2.0243	 18914.7031	 42.64	497.38	  100.00%	  4096	    8.8904	 74.09%	      0.37%	  0.8865
+   38	attn_q              	 166087.69	  0.0000	 20050.7402	 40.55	448.81	   99.98%	  4096	    8.6133	 71.78%	      0.46%	  0.9835
+   37	attn_q              	 146614.73	  0.7595	 20756.5176	 35.79	423.56	  100.00%	  4096	    8.3834	 69.86%	      0.44%	  0.9842
+   36	attn_q              	 134513.23	  0.5200	 19003.3398	 32.84	386.52	  100.00%	  4096	    8.2079	 68.40%	      0.51%	  0.9501
+   35	attn_q              	 124035.38	  1.3198	 11533.5068	 30.28	305.84	  100.00%	  4096	    8.2914	 69.09%	      0.71%	  0.9665
+   34	attn_q              	 123896.47	  0.5387	 17763.3496	 30.25	472.60	  100.00%	  4096	    6.6833	 55.69%	      0.44%	  0.9800
+   32	attn_q              	 111128.92	  0.1590	 25305.4961	 27.13	504.76	  100.00%	  4096	    6.2867	 52.39%	      0.37%	  0.9931
+   30	attn_q              	 109705.93	  0.0000	 33505.8359	 26.78	617.29	   99.98%	  4096	    5.4138	 45.11%	      0.27%	  0.9759
+   33	attn_q              	 109045.48	  0.9963	 20537.8262	 26.62	448.68	  100.00%	  4096	    6.6424	 55.35%	      0.37%	  0.9914
+   29	attn_q              	  87316.21	  0.0000	 20308.4004	 21.32	398.84	   99.95%	  4096	    6.1991	 51.66%	      0.37%	  0.9936
+   31	attn_q              	  87185.37	  0.0000	 22471.5254	 21.29	421.05	   99.98%	  4096	    6.2130	 51.78%	      0.34%	  0.9963
+   28	attn_q              	  82016.98	  0.0000	 23024.2656	 20.02	430.64	   99.95%	  4096	    5.6830	 47.36%	      0.29%	  0.9976
+   27	attn_q              	  76821.73	  0.0000	 17911.5156	 18.76	348.43	   99.98%	  4096	    6.3444	 52.87%	      0.34%	  0.9791
+   16	attn_q              	  76133.66	  0.0000	 11891.1016	 18.59	311.73	   99.93%	  4096	    6.1208	 51.01%	      0.42%	  0.9643
+   23	attn_q              	  74987.37	  0.0000	 18502.6172	 18.31	356.15	   99.95%	  4096	    6.1167	 50.97%	      0.39%	  0.9980
+   22	attn_q              	  71226.52	  0.0000	 18282.5273	 17.39	343.00	   99.98%	  4096	    6.2861	 52.38%	      0.32%	  0.9901
+   21	attn_q              	  69479.59	  0.0000	 14531.5439	 16.96	297.70	   99.95%	  4096	    6.6280	 55.23%	      0.39%	  0.9882
+   20	attn_q              	  68286.74	  0.0000	 18747.7070	 16.67	345.57	   99.95%	  4096	    6.0506	 50.42%	      0.34%	  0.9917
+   25	attn_q              	  68221.13	  0.0000	 14562.2783	 16.66	294.34	   99.98%	  4096	    6.3805	 53.17%	      0.39%	  0.9829
+    7	attn_q              	  68092.71	  0.0000	 17005.3926	 16.62	348.43	   99.90%	  4096	    5.9826	 49.85%	      0.32%	  0.9814
+   18	attn_q              	  66295.24	  0.0000	 12255.0391	 16.19	262.31	   99.95%	  4096	    6.9157	 57.63%	      0.42%	  0.9978
+   26	attn_q              	  65291.02	  0.0000	 12545.3467	 15.94	268.54	   99.98%	  4096	    6.6067	 55.06%	      0.39%	  0.9920
+   13	attn_q              	  59896.29	  0.0000	  8712.0469	 14.62	232.75	   99.90%	  4096	    6.9162	 57.63%	      0.32%	  0.9786
+   24	attn_q              	  56921.47	  0.0000	  9241.3613	 13.90	213.49	   99.98%	  4096	    7.0602	 58.84%	      0.54%	  0.9757
+   17	attn_q              	  56760.55	  0.0000	 10113.2490	 13.86	223.49	   99.95%	  4096	    6.7278	 56.06%	      0.44%	  0.9569
+   15	attn_q              	  55194.11	  0.0000	  9697.7783	 13.48	229.94	   99.93%	  4096	    5.9460	 49.55%	      0.37%	  0.9288
+   14	attn_q              	  54794.45	  0.0000	  8291.7021	 13.38	212.09	   99.90%	  4096	    7.0371	 58.64%	      0.37%	  0.9885
+    6	attn_q              	  53044.36	  0.0000	 16721.8047	 12.95	321.79	   99.88%	  4096	    4.5291	 37.74%	      0.32%	  0.9479
+   19	attn_q              	  52733.22	  0.0000	 11920.8223	 12.87	233.97	   99.95%	  4096	    6.5100	 54.25%	      0.39%	  0.9902
+    8	attn_q              	  51986.04	  0.0000	 10429.2197	 12.69	233.14	   99.90%	  4096	    6.5500	 54.58%	      0.29%	  0.9699
+    9	attn_q              	  49641.15	  0.0000	 10131.9502	 12.12	241.91	   99.90%	  4096	    5.8877	 49.06%	      0.34%	  0.9950
+   12	attn_q              	  48607.36	  0.0000	  7781.5098	 11.87	191.06	   99.93%	  4096	    7.0521	 58.77%	      0.37%	  0.9965
+    4	attn_q              	  46316.68	  0.0000	 16862.5684	 11.31	309.35	   99.85%	  4096	    5.2333	 43.61%	      0.22%	  0.7166
+    5	attn_q              	  45620.26	  0.0000	 16766.0762	 11.14	317.06	   99.88%	  4096	    4.5011	 37.51%	      0.22%	  0.9947
+   11	attn_q              	  45317.79	  0.0000	  6714.2949	 11.06	172.61	   99.93%	  4096	    7.2487	 60.41%	      0.37%	  0.9866
+   10	attn_q              	  43706.77	  0.0000	  6960.2920	 10.67	180.78	   99.93%	  4096	    6.7438	 56.20%	      0.34%	  0.9923
+    2	attn_q              	  19532.52	  0.0000	  6018.6182	  4.77	 99.81	   99.90%	  4096	    7.6636	 63.86%	      0.20%	  0.3212
+    3	attn_q              	  17324.65	  0.0000	  5779.3477	  4.23	110.43	   99.93%	  4096	    5.5684	 46.40%	      0.22%	  0.9580
+    1	attn_q              	  15856.24	  0.0000	  5183.1831	  3.87	 86.07	   98.66%	  4096	    6.6712	 55.59%	      0.22%	  0.3483
+    0	attn_q              	   3049.93	  0.0000	   247.0233	  0.74	  7.67	   97.14%	  4096	    6.8129	 56.77%	      1.12%	  0.0000
+   39	attn_v              	 174643.00	  2.0243	 18914.7031	 42.64	497.38	  100.00%	  4096	    8.8904	 74.09%	      0.37%	  0.8865
+   38	attn_v              	 166087.69	  0.0000	 20050.7402	 40.55	448.81	   99.98%	  4096	    8.6133	 71.78%	      0.46%	  0.9835
+   37	attn_v              	 146614.73	  0.7595	 20756.5176	 35.79	423.56	  100.00%	  4096	    8.3834	 69.86%	      0.44%	  0.9842
+   36	attn_v              	 134513.23	  0.5200	 19003.3398	 32.84	386.52	  100.00%	  4096	    8.2079	 68.40%	      0.51%	  0.9501
+   35	attn_v              	 124035.38	  1.3198	 11533.5068	 30.28	305.84	  100.00%	  4096	    8.2914	 69.09%	      0.71%	  0.9665
+   34	attn_v              	 123896.47	  0.5387	 17763.3496	 30.25	472.60	  100.00%	  4096	    6.6833	 55.69%	      0.44%	  0.9800
+   32	attn_v              	 111128.92	  0.1590	 25305.4961	 27.13	504.76	  100.00%	  4096	    6.2867	 52.39%	      0.37%	  0.9931
+   30	attn_v              	 109705.93	  0.0000	 33505.8359	 26.78	617.29	   99.98%	  4096	    5.4138	 45.11%	      0.27%	  0.9759
+   33	attn_v              	 109045.48	  0.9963	 20537.8262	 26.62	448.68	  100.00%	  4096	    6.6424	 55.35%	      0.37%	  0.9914
+   29	attn_v              	  87316.21	  0.0000	 20308.4004	 21.32	398.84	   99.95%	  4096	    6.1991	 51.66%	      0.37%	  0.9936
+   31	attn_v              	  87185.37	  0.0000	 22471.5254	 21.29	421.05	   99.98%	  4096	    6.2130	 51.78%	      0.34%	  0.9963
+   28	attn_v              	  82016.98	  0.0000	 23024.2656	 20.02	430.64	   99.95%	  4096	    5.6830	 47.36%	      0.29%	  0.9976
+   27	attn_v              	  76821.73	  0.0000	 17911.5156	 18.76	348.43	   99.98%	  4096	    6.3444	 52.87%	      0.34%	  0.9791
+   16	attn_v              	  76133.66	  0.0000	 11891.1016	 18.59	311.73	   99.93%	  4096	    6.1208	 51.01%	      0.42%	  0.9643
+   23	attn_v              	  74987.37	  0.0000	 18502.6172	 18.31	356.15	   99.95%	  4096	    6.1167	 50.97%	      0.39%	  0.9980
+   22	attn_v              	  71226.52	  0.0000	 18282.5273	 17.39	343.00	   99.98%	  4096	    6.2861	 52.38%	      0.32%	  0.9901
+   21	attn_v              	  69479.59	  0.0000	 14531.5439	 16.96	297.70	   99.95%	  4096	    6.6280	 55.23%	      0.39%	  0.9882
+   20	attn_v              	  68286.74	  0.0000	 18747.7070	 16.67	345.57	   99.95%	  4096	    6.0506	 50.42%	      0.34%	  0.9917
+   25	attn_v              	  68221.13	  0.0000	 14562.2783	 16.66	294.34	   99.98%	  4096	    6.3805	 53.17%	      0.39%	  0.9829
+    7	attn_v              	  68092.71	  0.0000	 17005.3926	 16.62	348.43	   99.90%	  4096	    5.9826	 49.85%	      0.32%	  0.9814
+   18	attn_v              	  66295.24	  0.0000	 12255.0391	 16.19	262.31	   99.95%	  4096	    6.9157	 57.63%	      0.42%	  0.9978
+   26	attn_v              	  65291.02	  0.0000	 12545.3467	 15.94	268.54	   99.98%	  4096	    6.6067	 55.06%	      0.39%	  0.9920
+   13	attn_v              	  59896.29	  0.0000	  8712.0469	 14.62	232.75	   99.90%	  4096	    6.9162	 57.63%	      0.32%	  0.9786
+   24	attn_v              	  56921.47	  0.0000	  9241.3613	 13.90	213.49	   99.98%	  4096	    7.0602	 58.84%	      0.54%	  0.9757
+   17	attn_v              	  56760.55	  0.0000	 10113.2490	 13.86	223.49	   99.95%	  4096	    6.7278	 56.06%	      0.44%	  0.9569
+   15	attn_v              	  55194.11	  0.0000	  9697.7783	 13.48	229.94	   99.93%	  4096	    5.9460	 49.55%	      0.37%	  0.9288
+   14	attn_v              	  54794.45	  0.0000	  8291.7021	 13.38	212.09	   99.90%	  4096	    7.0371	 58.64%	      0.37%	  0.9885
+    6	attn_v              	  53044.36	  0.0000	 16721.8047	 12.95	321.79	   99.88%	  4096	    4.5291	 37.74%	      0.32%	  0.9479
+   19	attn_v              	  52733.22	  0.0000	 11920.8223	 12.87	233.97	   99.95%	  4096	    6.5100	 54.25%	      0.39%	  0.9902
+    8	attn_v              	  51986.04	  0.0000	 10429.2197	 12.69	233.14	   99.90%	  4096	    6.5500	 54.58%	      0.29%	  0.9699
+    9	attn_v              	  49641.15	  0.0000	 10131.9502	 12.12	241.91	   99.90%	  4096	    5.8877	 49.06%	      0.34%	  0.9950
+   12	attn_v              	  48607.36	  0.0000	  7781.5098	 11.87	191.06	   99.93%	  4096	    7.0521	 58.77%	      0.37%	  0.9965
+    4	attn_v              	  46316.68	  0.0000	 16862.5684	 11.31	309.35	   99.85%	  4096	    5.2333	 43.61%	      0.22%	  0.7166
+    5	attn_v              	  45620.26	  0.0000	 16766.0762	 11.14	317.06	   99.88%	  4096	    4.5011	 37.51%	      0.22%	  0.9947
+   11	attn_v              	  45317.79	  0.0000	  6714.2949	 11.06	172.61	   99.93%	  4096	    7.2487	 60.41%	      0.37%	  0.9866
+   10	attn_v              	  43706.77	  0.0000	  6960.2920	 10.67	180.78	   99.93%	  4096	    6.7438	 56.20%	      0.34%	  0.9923
+    2	attn_v              	  19532.52	  0.0000	  6018.6182	  4.77	 99.81	   99.90%	  4096	    7.6636	 63.86%	      0.20%	  0.3212
+    3	attn_v              	  17324.65	  0.0000	  5779.3477	  4.23	110.43	   99.93%	  4096	    5.5684	 46.40%	      0.22%	  0.9580
+    1	attn_v              	  15856.24	  0.0000	  5183.1831	  3.87	 86.07	   98.66%	  4096	    6.6712	 55.59%	      0.22%	  0.3483
+    0	attn_v              	   3049.93	  0.0000	   247.0233	  0.74	  7.67	   97.14%	  4096	    6.8129	 56.77%	      1.12%	  0.0000
+   39	ffn_down            	1645556.38	  0.0689	 81837.1094	128.56	1422.92	  100.00%	 12800	    9.8110	 71.91%	      1.00%	  0.0173
+    5	ffn_down            	 381550.03	  0.0094	210713.1406	 29.81	2109.55	  100.00%	 12800	    1.6182	 11.86%	      0.03%	  0.0011
+   38	ffn_down            	 242713.44	  0.2437	  7073.1206	 18.96	 84.75	  100.00%	 12800	   12.6848	 92.97%	      0.70%	  0.0476
+    3	ffn_down            	 188951.92	  0.0109	147793.5938	 14.76	1332.36	  100.00%	 12800	    1.2131	  8.89%	      0.03%	  0.0026
+   37	ffn_down            	 142317.03	  0.0870	  5205.8745	 11.12	 52.73	  100.00%	 12800	   12.6322	 92.59%	      0.67%	  0.0329
+   36	ffn_down            	  83945.62	  0.0217	  2698.7646	  6.56	 37.12	  100.00%	 12800	   11.9912	 87.89%	      1.06%	  0.0443
+   35	ffn_down            	  42474.45	  0.0859	   952.5922	  3.32	 13.19	  100.00%	 12800	   12.1797	 89.27%	      2.48%	  0.0830
+   34	ffn_down            	  26102.06	  0.0438	   229.3722	  2.04	  5.52	  100.00%	 12800	   12.2821	 90.02%	      4.28%	  0.1049
+   33	ffn_down            	  12264.68	  0.0564	   152.2174	  0.96	  2.91	  100.00%	 12800	   12.2756	 89.97%	      3.31%	  0.0943
+    0	ffn_down            	   6042.44	  0.0000	  2911.0620	  0.47	 25.98	  100.00%	 12800	    5.6061	 41.09%	      0.12%	  0.0000
+   32	ffn_down            	   5920.96	  0.0421	    99.5476	  0.46	  1.42	  100.00%	 12800	   12.4740	 91.43%	      3.20%	  0.0558
+   31	ffn_down            	   3874.26	  0.0193	   185.5614	  0.30	  1.72	  100.00%	 12800	   12.4092	 90.95%	      1.28%	  0.0903
+   30	ffn_down            	   3486.52	  0.0333	    71.5827	  0.27	  0.87	  100.00%	 12800	   12.5027	 91.64%	      2.80%	  0.0724
+   29	ffn_down            	   2260.60	  0.0105	    59.7711	  0.18	  0.70	  100.00%	 12800	   12.4988	 91.61%	      1.99%	  0.0480
+    2	ffn_down            	   1941.90	  0.0007	   217.4457	  0.15	  1.95	  100.00%	 12800	   11.9799	 87.80%	      0.16%	  0.0440
+   28	ffn_down            	   1810.21	  0.0343	    70.6592	  0.14	  0.70	  100.00%	 12800	   12.6709	 92.87%	      0.97%	  0.0639
+    1	ffn_down            	   1559.32	  0.0002	    17.3429	  0.12	  0.21	  100.00%	 12800	   13.0362	 95.55%	      5.21%	  0.0058
+   27	ffn_down            	   1505.68	  0.0334	    16.9273	  0.12	  0.33	  100.00%	 12800	   12.8432	 94.13%	      1.88%	  0.0300
+   23	ffn_down            	   1423.83	  0.0149	    23.6004	  0.11	  0.42	  100.00%	 12800	   12.5741	 92.16%	      1.63%	  0.0554
+   24	ffn_down            	   1422.49	  0.0148	    57.0210	  0.11	  0.56	  100.00%	 12800	   12.6908	 93.01%	      0.84%	  0.0463
+   26	ffn_down            	   1401.04	  0.0277	   123.4429	  0.11	  1.10	  100.00%	 12800	   12.4077	 90.94%	      0.29%	  0.0151
+   25	ffn_down            	   1375.32	  0.0282	    80.1291	  0.11	  0.74	  100.00%	 12800	   12.6175	 92.48%	      0.48%	  0.0268
+   22	ffn_down            	   1156.34	  0.0120	    34.4371	  0.09	  0.38	  100.00%	 12800	   12.6976	 93.06%	      1.30%	  0.0673
+   21	ffn_down            	   1138.10	  0.0147	    24.3792	  0.09	  0.28	  100.00%	 12800	   12.7839	 93.70%	      2.28%	  0.0947
+   20	ffn_down            	   1136.30	  0.0127	    21.3931	  0.09	  0.26	  100.00%	 12800	   12.8313	 94.04%	      2.33%	  0.1177
+   18	ffn_down            	   1119.47	  0.0176	     4.8772	  0.09	  0.14	  100.00%	 12800	   12.9995	 95.28%	      5.52%	  0.2902
+   19	ffn_down            	   1116.88	  0.0151	    20.6434	  0.09	  0.23	  100.00%	 12800	   12.9391	 94.83%	      2.98%	  0.1868
+   16	ffn_down            	   1105.64	  0.0134	    17.2072	  0.09	  0.19	  100.00%	 12800	   13.0591	 95.71%	      3.31%	  0.0832
+   17	ffn_down            	   1041.27	  0.0162	     9.5109	  0.08	  0.13	  100.00%	 12800	   13.1452	 96.34%	      4.94%	  0.2264
+   15	ffn_down            	   1024.12	  0.0230	    43.3770	  0.08	  0.40	  100.00%	 12800	   12.7413	 93.39%	      1.24%	  0.0284
+    6	ffn_down            	   1022.13	  0.0078	   352.7156	  0.08	  3.12	  100.00%	 12800	    9.2787	 68.01%	      0.05%	  0.0001
+   14	ffn_down            	    951.70	  0.0253	    49.8595	  0.07	  0.50	  100.00%	 12800	   12.6100	 92.42%	      0.50%	  0.0720
+   11	ffn_down            	    926.64	  0.0218	    12.4872	  0.07	  0.13	  100.00%	 12800	   13.2980	 97.47%	      1.80%	  0.2713
+    4	ffn_down            	    923.82	  0.0080	    22.2460	  0.07	  0.37	  100.00%	 12800	   12.2201	 89.57%	      1.02%	  0.0012
+   12	ffn_down            	    888.91	  0.0240	     7.9189	  0.07	  0.12	  100.00%	 12800	   13.2283	 96.95%	      2.80%	  0.2412
+   10	ffn_down            	    857.79	  0.0211	     5.1418	  0.07	  0.10	  100.00%	 12800	   13.1941	 96.70%	      3.75%	  0.1709
+   13	ffn_down            	    845.87	  0.0263	     8.8175	  0.07	  0.11	  100.00%	 12800	   13.2368	 97.02%	      2.59%	  0.2583
+    9	ffn_down            	    829.72	  0.0127	    11.8182	  0.06	  0.21	  100.00%	 12800	   12.6312	 92.58%	      1.71%	  0.1047
+    7	ffn_down            	    761.20	  0.0088	    17.7730	  0.06	  0.18	  100.00%	 12800	   13.0089	 95.35%	      1.20%	  0.0092
+    8	ffn_down            	    714.58	  0.0115	     9.3180	  0.06	  0.15	  100.00%	 12800	   12.9415	 94.85%	      1.95%	  0.1090
+   39	ffn_gate            	  73855.20	  0.0000	 27529.4883	 18.03	432.89	   99.98%	  4096	    7.6055	 63.38%	      0.27%	  0.9793
+   38	ffn_gate            	  29146.70	  0.0000	  3154.5896	  7.12	 50.92	   99.98%	  4096	   10.6959	 89.13%	      0.63%	  0.9972
+   37	ffn_gate            	  23469.74	  0.0000	  1999.8401	  5.73	 32.33	  100.00%	  4096	   11.0207	 91.84%	      0.66%	  0.9944
+   36	ffn_gate            	  18879.52	  0.0000	  1587.3755	  4.61	 26.11	   99.98%	  4096	   10.9542	 91.28%	      0.68%	  0.9535
+   35	ffn_gate            	  12609.52	  0.0000	   691.8613	  3.08	 13.18	   99.95%	  4096	   10.9728	 91.44%	      1.10%	  0.7708
+   34	ffn_gate            	   9369.36	  0.0000	   369.9386	  2.29	  8.82	   99.98%	  4096	   10.8088	 90.07%	      1.39%	  0.9703
+   33	ffn_gate            	   6623.49	  0.0000	   206.4922	  1.62	  5.04	   99.98%	  4096	   11.0320	 91.93%	      1.56%	  0.9570
+   32	ffn_gate            	   4946.19	  0.2047	   142.2780	  1.21	  3.44	  100.00%	  4096	   11.1646	 93.04%	      1.49%	  0.8361
+    0	ffn_gate            	   4647.99	  0.0000	   530.0613	  1.13	 10.15	   68.41%	  4096	    8.6122	 71.77%	      1.15%	  0.0000
+   31	ffn_gate            	   4116.51	  0.0000	   180.2167	  1.01	  3.74	   99.98%	  4096	   11.0407	 92.01%	      1.32%	  0.5779
+    1	ffn_gate            	   3766.61	  0.0000	   642.9065	  0.92	 11.02	   99.22%	  4096	    9.7890	 81.57%	      0.12%	  0.0923
+   30	ffn_gate            	   3736.23	  0.0000	    93.6410	  0.91	  2.60	  100.00%	  4096	   11.2482	 93.73%	      1.29%	  0.9941
+   29	ffn_gate            	   3591.15	  0.0000	    88.1915	  0.88	  2.41	   99.98%	  4096	   11.3407	 94.51%	      1.10%	  0.9684
+   25	ffn_gate            	   3420.11	  0.0000	    73.2920	  0.83	  2.34	   99.98%	  4096	   11.3321	 94.43%	      0.85%	  0.9818
+   12	ffn_gate            	   3417.91	  0.0000	    98.0158	  0.83	  1.89	   99.95%	  4096	   11.6038	 96.70%	      0.49%	  0.9870
+   26	ffn_gate            	   3406.55	  0.0000	    75.7852	  0.83	  2.13	   99.98%	  4096	   11.4214	 95.18%	      0.88%	  0.9927
+   13	ffn_gate            	   3312.10	  0.0000	    90.1448	  0.81	  1.61	   99.98%	  4096	   11.6814	 97.34%	      0.51%	  0.9759
+   11	ffn_gate            	   3301.55	  0.0000	   105.7369	  0.81	  2.04	   99.95%	  4096	   11.5318	 96.10%	      0.44%	  0.9904
+   28	ffn_gate            	   3275.83	  0.0000	    68.6310	  0.80	  1.93	   99.98%	  4096	   11.4178	 95.15%	      1.22%	  0.9578
+   27	ffn_gate            	   3236.11	  0.0000	    72.2997	  0.79	  1.87	   99.98%	  4096	   11.4812	 95.68%	      1.03%	  0.9950
+   14	ffn_gate            	   3080.71	  0.0000	    65.3723	  0.75	  1.33	   99.98%	  4096	   11.6985	 97.49%	      0.71%	  0.9506
+   16	ffn_gate            	   3016.78	  0.0000	    55.2134	  0.74	  1.58	   99.98%	  4096	   11.5581	 96.32%	      0.76%	  0.9874
+   24	ffn_gate            	   3010.61	  0.0000	    73.8905	  0.74	  2.21	  100.00%	  4096	   11.2557	 93.80%	      0.93%	  0.9690
+   22	ffn_gate            	   2879.76	  0.0001	    77.3697	  0.70	  2.02	  100.00%	  4096	   11.3401	 94.50%	      0.81%	  0.9957
+   17	ffn_gate            	   2870.70	  0.0000	    51.7692	  0.70	  1.48	   99.98%	  4096	   11.5662	 96.39%	      0.73%	  0.9959
+   23	ffn_gate            	   2843.65	  0.0001	    89.6189	  0.69	  2.21	  100.00%	  4096	   11.2398	 93.66%	      0.95%	  0.9937
+   10	ffn_gate            	   2833.02	  0.0000	    85.4598	  0.69	  1.74	   99.90%	  4096	   11.5267	 96.06%	      0.46%	  0.8381
+   19	ffn_gate            	   2776.20	  0.0000	    70.3380	  0.68	  1.86	  100.00%	  4096	   11.3917	 94.93%	      0.71%	  0.9944
+   15	ffn_gate            	   2760.72	  0.0000	    57.4514	  0.67	  1.45	   99.95%	  4096	   11.5659	 96.38%	      0.83%	  0.9038
+   18	ffn_gate            	   2754.00	  0.0001	    61.1560	  0.67	  1.55	  100.00%	  4096	   11.5243	 96.04%	      0.76%	  0.9902
+   21	ffn_gate            	   2737.92	  0.0000	    70.9311	  0.67	  1.86	   99.98%	  4096	   11.3741	 94.78%	      0.81%	  0.9902
+   20	ffn_gate            	   2699.39	  0.0000	    65.5763	  0.66	  1.79	   99.98%	  4096	   11.3889	 94.91%	      0.83%	  0.9932
+    8	ffn_gate            	   2469.90	  0.0000	   103.2819	  0.60	  1.84	   99.93%	  4096	   11.4803	 95.67%	      0.56%	  0.9061
+    2	ffn_gate            	   2319.60	  0.0000	   630.8475	  0.57	 10.17	   99.80%	  4096	    8.7421	 72.85%	      0.12%	  0.0200
+    9	ffn_gate            	   2312.98	  0.0000	    70.3176	  0.56	  1.47	   99.93%	  4096	   11.4845	 95.70%	      0.76%	  0.9660
+    7	ffn_gate            	   2253.67	  0.0000	    58.9012	  0.55	  1.44	   99.93%	  4096	   11.5263	 96.05%	      0.54%	  0.9532
+    5	ffn_gate            	   2213.64	  0.0000	   330.8649	  0.54	  5.46	   99.93%	  4096	   10.0780	 83.98%	      0.24%	  0.2463
+    6	ffn_gate            	   1791.24	  0.0000	    42.9261	  0.44	  1.12	   99.90%	  4096	   11.4775	 95.65%	      0.66%	  0.2691
+    4	ffn_gate            	   1789.65	  0.0000	   112.6252	  0.44	  2.11	   99.93%	  4096	   11.0733	 92.28%	      0.29%	  0.9765
+    3	ffn_gate            	   1716.85	  0.0000	   175.6357	  0.42	  3.39	   99.90%	  4096	   10.3538	 86.28%	      0.22%	  0.8606
+   39	ffn_up              	  73855.20	  0.0000	 27529.4883	 18.03	432.89	   99.98%	  4096	    7.6055	 63.38%	      0.27%	  0.9793
+   38	ffn_up              	  29146.70	  0.0000	  3154.5896	  7.12	 50.92	   99.98%	  4096	   10.6959	 89.13%	      0.63%	  0.9972
+   37	ffn_up              	  23469.74	  0.0000	  1999.8401	  5.73	 32.33	  100.00%	  4096	   11.0207	 91.84%	      0.66%	  0.9944
+   36	ffn_up              	  18879.52	  0.0000	  1587.3755	  4.61	 26.11	   99.98%	  4096	   10.9542	 91.28%	      0.68%	  0.9535
+   35	ffn_up              	  12609.52	  0.0000	   691.8613	  3.08	 13.18	   99.95%	  4096	   10.9728	 91.44%	      1.10%	  0.7708
+   34	ffn_up              	   9369.36	  0.0000	   369.9386	  2.29	  8.82	   99.98%	  4096	   10.8088	 90.07%	      1.39%	  0.9703
+   33	ffn_up              	   6623.49	  0.0000	   206.4922	  1.62	  5.04	   99.98%	  4096	   11.0320	 91.93%	      1.56%	  0.9570
+   32	ffn_up              	   4946.19	  0.2047	   142.2780	  1.21	  3.44	  100.00%	  4096	   11.1646	 93.04%	      1.49%	  0.8361
+    0	ffn_up              	   4647.99	  0.0000	   530.0613	  1.13	 10.15	   68.41%	  4096	    8.6122	 71.77%	      1.15%	  0.0000
+   31	ffn_up              	   4116.51	  0.0000	   180.2167	  1.01	  3.74	   99.98%	  4096	   11.0407	 92.01%	      1.32%	  0.5779
+    1	ffn_up              	   3766.61	  0.0000	   642.9065	  0.92	 11.02	   99.22%	  4096	    9.7890	 81.57%	      0.12%	  0.0923
+   30	ffn_up              	   3736.23	  0.0000	    93.6410	  0.91	  2.60	  100.00%	  4096	   11.2482	 93.73%	      1.29%	  0.9941
+   29	ffn_up              	   3591.15	  0.0000	    88.1915	  0.88	  2.41	   99.98%	  4096	   11.3407	 94.51%	      1.10%	  0.9684
+   25	ffn_up              	   3420.11	  0.0000	    73.2920	  0.83	  2.34	   99.98%	  4096	   11.3321	 94.43%	      0.85%	  0.9818
+   12	ffn_up              	   3417.91	  0.0000	    98.0158	  0.83	  1.89	   99.95%	  4096	   11.6038	 96.70%	      0.49%	  0.9870
+   26	ffn_up              	   3406.55	  0.0000	    75.7852	  0.83	  2.13	   99.98%	  4096	   11.4214	 95.18%	      0.88%	  0.9927
+   13	ffn_up              	   3312.10	  0.0000	    90.1448	  0.81	  1.61	   99.98%	  4096	   11.6814	 97.34%	      0.51%	  0.9759
+   11	ffn_up              	   3301.55	  0.0000	   105.7369	  0.81	  2.04	   99.95%	  4096	   11.5318	 96.10%	      0.44%	  0.9904
+   28	ffn_up              	   3275.83	  0.0000	    68.6310	  0.80	  1.93	   99.98%	  4096	   11.4178	 95.15%	      1.22%	  0.9578
+   27	ffn_up              	   3236.11	  0.0000	    72.2997	  0.79	  1.87	   99.98%	  4096	   11.4812	 95.68%	      1.03%	  0.9950
+   14	ffn_up              	   3080.71	  0.0000	    65.3723	  0.75	  1.33	   99.98%	  4096	   11.6985	 97.49%	      0.71%	  0.9506
+   16	ffn_up              	   3016.78	  0.0000	    55.2134	  0.74	  1.58	   99.98%	  4096	   11.5581	 96.32%	      0.76%	  0.9874
+   24	ffn_up              	   3010.61	  0.0000	    73.8905	  0.74	  2.21	  100.00%	  4096	   11.2557	 93.80%	      0.93%	  0.9690
+   22	ffn_up              	   2879.76	  0.0001	    77.3697	  0.70	  2.02	  100.00%	  4096	   11.3401	 94.50%	      0.81%	  0.9957
+   17	ffn_up              	   2870.70	  0.0000	    51.7692	  0.70	  1.48	   99.98%	  4096	   11.5662	 96.39%	      0.73%	  0.9959
+   23	ffn_up              	   2843.65	  0.0001	    89.6189	  0.69	  2.21	  100.00%	  4096	   11.2398	 93.66%	      0.95%	  0.9937
+   10	ffn_up              	   2833.02	  0.0000	    85.4598	  0.69	  1.74	   99.90%	  4096	   11.5267	 96.06%	      0.46%	  0.8381
+   19	ffn_up              	   2776.20	  0.0000	    70.3380	  0.68	  1.86	  100.00%	  4096	   11.3917	 94.93%	      0.71%	  0.9944
+   15	ffn_up              	   2760.72	  0.0000	    57.4514	  0.67	  1.45	   99.95%	  4096	   11.5659	 96.38%	      0.83%	  0.9038
+   18	ffn_up              	   2754.00	  0.0001	    61.1560	  0.67	  1.55	  100.00%	  4096	   11.5243	 96.04%	      0.76%	  0.9902
+   21	ffn_up              	   2737.92	  0.0000	    70.9311	  0.67	  1.86	   99.98%	  4096	   11.3741	 94.78%	      0.81%	  0.9902
+   20	ffn_up              	   2699.39	  0.0000	    65.5763	  0.66	  1.79	   99.98%	  4096	   11.3889	 94.91%	      0.83%	  0.9932
+    8	ffn_up              	   2469.90	  0.0000	   103.2819	  0.60	  1.84	   99.93%	  4096	   11.4803	 95.67%	      0.56%	  0.9061
+    2	ffn_up              	   2319.60	  0.0000	   630.8475	  0.57	 10.17	   99.80%	  4096	    8.7421	 72.85%	      0.12%	  0.0200
+    9	ffn_up              	   2312.98	  0.0000	    70.3176	  0.56	  1.47	   99.93%	  4096	   11.4845	 95.70%	      0.76%	  0.9660
+    7	ffn_up              	   2253.67	  0.0000	    58.9012	  0.55	  1.44	   99.93%	  4096	   11.5263	 96.05%	      0.54%	  0.9532
+    5	ffn_up              	   2213.64	  0.0000	   330.8649	  0.54	  5.46	   99.93%	  4096	   10.0780	 83.98%	      0.24%	  0.2463
+    6	ffn_up              	   1791.24	  0.0000	    42.9261	  0.44	  1.12	   99.90%	  4096	   11.4775	 95.65%	      0.66%	  0.2691
+    4	ffn_up              	   1789.65	  0.0000	   112.6252	  0.44	  2.11	   99.93%	  4096	   11.0733	 92.28%	      0.29%	  0.9765
+    3	ffn_up              	   1716.85	  0.0000	   175.6357	  0.42	  3.39	   99.90%	  4096	   10.3538	 86.28%	      0.22%	  0.8606
+
+Computing weighted average statistics per layer (40 layers)
+
+  Layer	     μΣ(Act²)	      μZD	μCosSim
+================================================
+    0	       4139.83	    0.7411%	0.0000
+    1	       6791.54	    2.9832%	0.1389
+    2	       7785.62	    1.9852%	0.1614
+    3	      70900.05	    1.2575%	0.5370
+    4	      15985.68	    1.4608%	0.4854
+    5	     146183.94	    0.8107%	0.4142
+    6	      18205.81	    1.3806%	0.4006
+    7	      23167.60	    1.2842%	0.5735
+    8	      17900.25	    1.4849%	0.5729
+    9	      17128.10	    1.5571%	0.6014
+   10	      15332.18	    2.2715%	0.5906
+   11	      15983.94	    1.9451%	0.6469
+   12	      17056.90	    2.1752%	0.6652
+   13	      20767.65	    2.4856%	0.6752
+   14	      19054.13	    1.1933%	0.5841
+   15	      19172.65	    1.4341%	0.5356
+   16	      26136.96	    1.8568%	0.5790
+   17	      19724.82	    2.5230%	0.6361
+   18	      22839.35	    2.4882%	0.6723
+   19	      18405.42	    1.6588%	0.6325
+   20	      23508.35	    1.5224%	0.6168
+   21	      23910.19	    1.5866%	0.5942
+   22	      24533.16	    1.1531%	0.5889
+   23	      25862.99	    1.2548%	0.5850
+   24	      19961.15	    1.3993%	0.5695
+   25	      23721.45	    0.7063%	0.5718
+   26	      22758.83	    0.8053%	0.5699
+   27	      26575.09	    1.3538%	0.5727
+   28	      28424.57	    1.0889%	0.5796
+   29	      30363.12	    1.5732%	0.5756
+   30	      38224.65	    1.7311%	0.5899
+   31	      31137.59	    1.3886%	0.5094
+   32	      39814.40	    1.8755%	0.5482
+   33	      41853.15	    1.9772%	0.5874
+   34	      52107.42	    2.3491%	0.5840
+   35	      58491.29	    1.8193%	0.5410
+   36	      77988.16	    1.1558%	0.5635
+   37	     103052.64	    1.1210%	0.5778
+   38	     145584.28	    1.5143%	0.5889
+   39	     640944.31	    1.3538%	0.5533