diff --git a/Llama-3.2-3B-Instruct-Q2_K.gguf b/Llama-3.2-3B-Instruct-Q2_K.gguf index d0c528e..d43c602 100644 --- a/Llama-3.2-3B-Instruct-Q2_K.gguf +++ b/Llama-3.2-3B-Instruct-Q2_K.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f355e9b1a6c69ee7ea297f8b3bb38c44ab00ad7bc9f699babe0a02eae61cf276 +oid sha256:2dabdba85d46f31b464a0fded5631c5bddec151caefb45dd8f4894e477c41897 size 1363935520 diff --git a/Llama-3.2-3B-Instruct-Q3_K_L.gguf b/Llama-3.2-3B-Instruct-Q3_K_L.gguf index 403cb8f..0feb274 100644 --- a/Llama-3.2-3B-Instruct-Q3_K_L.gguf +++ b/Llama-3.2-3B-Instruct-Q3_K_L.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f778dda3fa1dd1c34747038221113b7940b3b26645e50775bbc8b4a8997040c6 +oid sha256:57d59b635b58cc4ce331a86aa197624837af97b40d26c22c284358cd8de1cd9f size 1815347488 diff --git a/Llama-3.2-3B-Instruct-Q3_K_M.gguf b/Llama-3.2-3B-Instruct-Q3_K_M.gguf index 481e92d..88a061a 100644 --- a/Llama-3.2-3B-Instruct-Q3_K_M.gguf +++ b/Llama-3.2-3B-Instruct-Q3_K_M.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:21c7b1e2c11ce80e0de67c3b6aeace40edf6cd0c6606d3c0085117b9c8951669 +oid sha256:84a27af779dabc1480470b8950e5d6d060957f4fe8df165863981d5fe77be4da size 1687159072 diff --git a/Llama-3.2-3B-Instruct-Q3_K_S.gguf b/Llama-3.2-3B-Instruct-Q3_K_S.gguf index f0f23c9..3b8e8b9 100644 --- a/Llama-3.2-3B-Instruct-Q3_K_S.gguf +++ b/Llama-3.2-3B-Instruct-Q3_K_S.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:24f06a24cf262e93c9c25dea3f207593e23293df4732a49cdc887bbf3d145e14 +oid sha256:8434d06c50ff5c8113fefbd0e275d8879ac15ec29c5330d3fee61b295a3490f4 size 1542848800 diff --git a/Llama-3.2-3B-Instruct-Q4_0.gguf b/Llama-3.2-3B-Instruct-Q4_0.gguf index e221e32..5cefed3 100644 --- a/Llama-3.2-3B-Instruct-Q4_0.gguf +++ b/Llama-3.2-3B-Instruct-Q4_0.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aec4181a9debbcd9213f4c8e6b4b33bd24181feb373332d904839492a8b4169b +oid sha256:8cc8df7386113cadf7f592fcf4a25cf9ac46083ee44b521132b4448261031d99 size 1917190432 diff --git a/Llama-3.2-3B-Instruct-Q4_K_M.gguf b/Llama-3.2-3B-Instruct-Q4_K_M.gguf index 524f921..a4d0913 100644 --- a/Llama-3.2-3B-Instruct-Q4_K_M.gguf +++ b/Llama-3.2-3B-Instruct-Q4_K_M.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e4f1a04d927b09ec18eb2f233d85ecd760fc2d35cec97e37f8604d3632210d9a +oid sha256:c5e6cf2c071a429e2380d2d1182c06a20b8c999d0c059636530e4a84beb8e8d4 size 2019377440 diff --git a/Llama-3.2-3B-Instruct-Q4_K_S.gguf b/Llama-3.2-3B-Instruct-Q4_K_S.gguf index c848b0c..75a5002 100644 --- a/Llama-3.2-3B-Instruct-Q4_K_S.gguf +++ b/Llama-3.2-3B-Instruct-Q4_K_S.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f3e5cc3cb1d83b9b9b2876250db8703d93eb23803598eafd3aafe5b5da99d1f +oid sha256:9054a2b99ae8e37d70b484dccde32b2eedc5d9510330d1d05a3ff90147a24ec7 size 1928200480 diff --git a/Llama-3.2-3B-Instruct-Q5_0.gguf b/Llama-3.2-3B-Instruct-Q5_0.gguf index 99fcd1e..6aedb6a 100644 --- a/Llama-3.2-3B-Instruct-Q5_0.gguf +++ b/Llama-3.2-3B-Instruct-Q5_0.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c112217953cbe9e97e03ac9e459d1629cf939ccaf669bde8250901cf2277ef4c +oid sha256:0ae5f5bfd45f7516e8253d78f300c3e4be328291ca3e0eb3b5bf7b8d867ab740 size 2269511968 diff --git a/Llama-3.2-3B-Instruct-Q5_K_M.gguf b/Llama-3.2-3B-Instruct-Q5_K_M.gguf index ccfafb2..da6de4e 100644 --- a/Llama-3.2-3B-Instruct-Q5_K_M.gguf +++ b/Llama-3.2-3B-Instruct-Q5_K_M.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5fcbaeaa8e8cd835fd38f2d1daccd58816ba79af262d2335b7454cf0bd21d7cf +oid sha256:e02e674781b7e2fe80318de645397f957f7b768e86edb42bd9fa0a120578855b size 2322153760 diff --git a/Llama-3.2-3B-Instruct-Q5_K_S.gguf b/Llama-3.2-3B-Instruct-Q5_K_S.gguf index deebd9b..5ff7087 100644 --- a/Llama-3.2-3B-Instruct-Q5_K_S.gguf +++ b/Llama-3.2-3B-Instruct-Q5_K_S.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a47518afcfee91bf0b4a6da63ad87774b9dc403a643f3450fb1761fd5a03b59d +oid sha256:19b73a5b64fda6f297cc6e031a0b5055b8ef4ed9e09a90d9599150a247cf4b1e size 2269511968 diff --git a/Llama-3.2-3B-Instruct-Q6_K.gguf b/Llama-3.2-3B-Instruct-Q6_K.gguf index 4efd68b..25f60f0 100644 --- a/Llama-3.2-3B-Instruct-Q6_K.gguf +++ b/Llama-3.2-3B-Instruct-Q6_K.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2ccc943ca31e72526a309b319b15d1ec453cd1c01e27aea4731ccc6a3bfab264 +oid sha256:51c797166082bed6c67fcc8d5d745eb9b4f23455dd35f0d4b0fbb88b04b33e7b size 2643853600 diff --git a/Llama-3.2-3B-Instruct-Q8_0.gguf b/Llama-3.2-3B-Instruct-Q8_0.gguf index d6716c1..663296f 100644 --- a/Llama-3.2-3B-Instruct-Q8_0.gguf +++ b/Llama-3.2-3B-Instruct-Q8_0.gguf @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:94f22b7231df5cd1907ff48dba54497b2d7912a4ce60d914f3dcfc0347fa8f21 +oid sha256:45b690c2640b7c36e2ccb9305a858f8a95d804711e3f90743d646e1808949e1f size 3421899040 diff --git a/README.md b/README.md index cd9a764..755325f 100644 --- a/README.md +++ b/README.md @@ -37,7 +37,7 @@ tags: ## Run with LlamaEdge -- LlamaEdge version: [v0.14.5](https://github.com/LlamaEdge/LlamaEdge/releases/tag/0.14.5) and above +- LlamaEdge version: [v0.16.5](https://github.com/LlamaEdge/LlamaEdge/releases/tag/0.16.5) and above - Prompt template @@ -126,4 +126,4 @@ tags: | [Llama-3.2-3B-Instruct-Q8_0.gguf](https://huggingface.co/second-state/Llama-3.2-3B-Instruct-GGUF/blob/main/Llama-3.2-3B-Instruct-Q8_0.gguf) | Q8_0 | 8 | 1.32 GB| very large, extremely low quality loss - not recommended | | [Llama-3.2-3B-Instruct-f16.gguf](https://huggingface.co/second-state/Llama-3.2-3B-Instruct-GGUF/blob/main/Llama-3.2-3B-Instruct-f16.gguf) | f16 | 16 | 2.48 GB| | -*Quantized with llama.cpp b3807* +*Quantized with llama.cpp b4466*