CUDA: MMQ support for iq4_nl, iq4_xs (#8278)

This commit is contained in:
Johannes Gäßler
2024-07-05 09:06:31 +02:00
committed by GitHub
parent 0a423800ff
commit 8e558309dc
7 changed files with 226 additions and 80 deletions

View File

@@ -0,0 +1,5 @@
// This file has been autogenerated by generate_cu_files.py, do not edit manually.
#include "../mmq.cuh"
// Emits the MMQ case for GGML_TYPE_IQ4_XS via the DECL_MMQ_CASE macro.
// NOTE(review): the macro is presumably provided by ../mmq.cuh and likely expands to a
// per-type template instantiation; its definition is not visible here, so confirm there.
// This file is generated, so lasting changes belong in generate_cu_files.py rather than here.
DECL_MMQ_CASE(GGML_TYPE_IQ4_XS);