commit 1caced4520ca4c6b618079798369871c77a3cd4f Author: ModelHub XC Date: Wed Jun 17 16:26:16 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: duyntnet/Azzurro-imatrix-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..07c341c --- /dev/null +++ b/.gitattributes @@ -0,0 +1,62 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Azzurro-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Azzurro-IQ1_M.gguf b/Azzurro-IQ1_M.gguf new file mode 100644 index 0000000..ce1b563 --- /dev/null +++ b/Azzurro-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00df6878b2fce229223d5d2c2ee615f55fc49c11c8bfa37164f4b7bbc72d4daf +size 1754446784 diff --git a/Azzurro-IQ1_S.gguf b/Azzurro-IQ1_S.gguf new file mode 100644 index 0000000..14580c0 --- /dev/null +++ b/Azzurro-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:489eecc53220bff4dc9d44645e90193a20e4d40fd2ae30a6f94d7ea6861b48a7 +size 1612102592 diff --git a/Azzurro-IQ2_M.gguf b/Azzurro-IQ2_M.gguf new file mode 100644 index 0000000..8ea0a32 --- /dev/null +++ b/Azzurro-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc9b8b497d81ce2a31c0354528755cc25a4fa8b8b24f691baf9a56d19acac5bb +size 2500713408 diff --git a/Azzurro-IQ2_S.gguf b/Azzurro-IQ2_S.gguf new file mode 100644 index 0000000..fd9955d --- /dev/null +++ b/Azzurro-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71bc20fdf83371d877d62c424de93786f48dc1aa09be77bfc91394c4bd6fbc24 +size 2310921152 diff --git a/Azzurro-IQ2_XS.gguf b/Azzurro-IQ2_XS.gguf new file mode 100644 index 0000000..f1a74a7 --- /dev/null +++ b/Azzurro-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0e2b88d051fc4d4593eece587e85c5d429a82416e1456f33040c5313757169 +size 2198256576 diff --git a/Azzurro-IQ2_XXS.gguf b/Azzurro-IQ2_XXS.gguf new file mode 100644 index 0000000..713f229 --- /dev/null +++ b/Azzurro-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f28b9a8c7a12e1583f2882236b0e510921f4b031ee79a5b6412f498bfb0205d0 +size 1991687104 diff --git a/Azzurro-IQ3_M.gguf b/Azzurro-IQ3_M.gguf new file mode 100644 index 0000000..11646bd --- /dev/null +++ b/Azzurro-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f664eb7ba0bb3001ce4ed817f7f6720713e7cdc73ef856ead7772f05ddbe1807 +size 3284892608 diff --git a/Azzurro-IQ3_S.gguf b/Azzurro-IQ3_S.gguf new file mode 100644 index 0000000..a20641b --- /dev/null +++ b/Azzurro-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc8cd31c7f56956dc557ca86b2ba230978e69ca78b260c39626e308ef8389df +size 3182394304 diff --git a/Azzurro-IQ3_XS.gguf b/Azzurro-IQ3_XS.gguf new file mode 100644 index 0000000..25824ed --- /dev/null +++ b/Azzurro-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca732e7ec9b23393f9dbd2ad05fef2fe743056263abe6a2dc7d63dd39655706 +size 3018816448 diff --git a/Azzurro-IQ3_XXS.gguf b/Azzurro-IQ3_XXS.gguf new file mode 100644 index 0000000..5e8bd98 --- /dev/null +++ b/Azzurro-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b49cb0bf097dd0ee89007421ed36990d1ebd3e5ce5fd104e832130e969e409b9 +size 2827344832 diff --git a/Azzurro-IQ4_NL.gguf b/Azzurro-IQ4_NL.gguf new file mode 100644 index 0000000..11bcb47 --- /dev/null +++ b/Azzurro-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9dd51360b2dce31fd91899a5e0f5512932c72d3bc90c91235f24353ae2017e4 +size 4125694912 diff --git a/Azzurro-IQ4_XS.gguf b/Azzurro-IQ4_XS.gguf new file mode 100644 index 0000000..6c5276b --- /dev/null +++ b/Azzurro-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd293ca9267884155ad317c797fbf018ed6260d3b54f7f955ea320c38bef372 +size 3907689408 diff --git a/Azzurro-Q2_K.gguf b/Azzurro-Q2_K.gguf new file mode 100644 index 0000000..7a2fffb --- /dev/null +++ b/Azzurro-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072ed33f893e54b04f0eb9ef59851d3a63b2f5be74d85d6ad20ec74fd428a38f +size 2719243200 diff --git a/Azzurro-Q2_K_S.gguf b/Azzurro-Q2_K_S.gguf new file mode 100644 index 0000000..7982b3d --- /dev/null +++ b/Azzurro-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a81c3735343e8581c5b868ec0bc0a4ac38c963532d5a44d10ba178656bae1c02 +size 2528926656 diff --git a/Azzurro-Q3_K_L.gguf b/Azzurro-Q3_K_L.gguf new file mode 100644 index 0000000..e46b2d7 --- /dev/null +++ b/Azzurro-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca8c00b597def38ebe91e877e204bfc08e606e2c6f2380485ed06f447d1c848 +size 3822025664 diff --git a/Azzurro-Q3_K_M.gguf b/Azzurro-Q3_K_M.gguf new file mode 100644 index 0000000..778bf36 --- /dev/null +++ b/Azzurro-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774ea73c8e20b5756c61a6fa624268fc4c7d52a2e638edc7b315eb2896689b46 +size 3518987200 diff --git a/Azzurro-Q3_K_S.gguf b/Azzurro-Q3_K_S.gguf new file mode 100644 index 0000000..988d9cb --- /dev/null +++ b/Azzurro-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ceffe723d0bf27612aa1dce6ddd1e7a6a6e7dcd0946b81f3c0d2fc99d12877 +size 3164568512 diff --git a/Azzurro-Q4_0.gguf b/Azzurro-Q4_0.gguf new file mode 100644 index 0000000..21fd044 --- /dev/null +++ b/Azzurro-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1969d712225280728df9e23743d233c7c6c07525ee1fa71289debe0cf27d8deb +size 4123597760 diff --git a/Azzurro-Q4_1.gguf b/Azzurro-Q4_1.gguf new file mode 100644 index 0000000..866b5f2 --- /dev/null +++ b/Azzurro-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7cfc8e2e3a724b7ab554e3052d80d716f190b75ad76d0629afeb3c78afe45c +size 4553317312 diff --git a/Azzurro-Q4_K_M.gguf b/Azzurro-Q4_K_M.gguf new file mode 100644 index 0000000..a1bcdbd --- /dev/null +++ b/Azzurro-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecdea91b288df5f8f38f1426b30d8afafb73eaca11c86e1701ae73e9fb5a1db0 +size 4368440256 diff --git a/Azzurro-Q4_K_S.gguf b/Azzurro-Q4_K_S.gguf new file mode 100644 index 0000000..e7bde46 --- /dev/null +++ b/Azzurro-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:696f480a2ff8b8c1e001ad6e4f80c3c27ea9fde300523816dc3fe2e3f428709c +size 4140374976 diff --git a/Azzurro-Q5_0.gguf b/Azzurro-Q5_0.gguf new file mode 100644 index 0000000..e39f535 --- /dev/null +++ b/Azzurro-Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849a429592d90125b42e289e0a3b14e0bf91ff3994cd8cfbea69a00c5d0eed85 +size 5012396992 diff --git a/Azzurro-Q5_1.gguf b/Azzurro-Q5_1.gguf new file mode 100644 index 0000000..832830b --- /dev/null +++ b/Azzurro-Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:504ed2e44e166df1ec424e1a2d69644e68ef93c99dd4aa2aeedd8e5d2e2c460a +size 5442116544 diff --git a/Azzurro-Q5_K_M.gguf b/Azzurro-Q5_K_M.gguf new file mode 100644 index 0000000..223f1ae --- /dev/null +++ b/Azzurro-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5499deb7271dc238d4363321bb1e4691ae17e788e64a4cec47defbccb70352b9 +size 5131410368 diff --git a/Azzurro-Q5_K_S.gguf b/Azzurro-Q5_K_S.gguf new file mode 100644 index 0000000..675d219 --- /dev/null +++ b/Azzurro-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b65ee4d2d82945e0bded3868f92bd909e86248ca017c27d1a446b5bb86083be5 +size 4997716928 diff --git a/Azzurro-Q6_K.gguf b/Azzurro-Q6_K.gguf new file mode 100644 index 0000000..01cf722 --- /dev/null +++ b/Azzurro-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2a15d00bda7ddf3392fa408c1f93c0eae472830b0e97c51473a8a3899ab1c2 +size 5942066112 diff --git a/Azzurro-Q8_0.gguf b/Azzurro-Q8_0.gguf new file mode 100644 index 0000000..bf531fb --- /dev/null +++ b/Azzurro-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06395aff8e30a5de0f473cf551ba09333bbff4c2cf5f2e72ab0bf10f06eec588 +size 7695858624 diff --git a/README.md b/README.md new file mode 100644 index 0000000..7527a93 --- /dev/null +++ b/README.md @@ -0,0 +1,62 @@ +--- +license: other +language: +- en +pipeline_tag: text-generation +inference: false +tags: +- transformers +- gguf +- imatrix +- Azzurro +--- +Quantizations of https://huggingface.co/MoxoffSpA/Azzurro + + +# From original readme + +## Usage + +Be sure to install these dependencies before running the program + +```python +!pip install transformers torch sentencepiece +``` + +```python +from transformers import AutoModelForCausalLM, AutoTokenizer + +device = "cpu" # if you want to use the gpu make sure to have cuda toolkit installed and change this to "cuda" + +model = AutoModelForCausalLM.from_pretrained("MoxoffSpA/Azzurro") +tokenizer = AutoTokenizer.from_pretrained("MoxoffSpA/Azzurro") + +question = """Quanto è alta la torre di Pisa?""" +context = """ +La Torre di Pisa è un campanile del XII secolo, famoso per la sua inclinazione. Alta circa 56 metri. +""" + +prompt = f"Domanda: {question}, contesto: {context}" + +messages = [ + {"role": "user", "content": prompt} +] + +encodeds = tokenizer.apply_chat_template(messages, return_tensors="pt") + +model_inputs = encodeds.to(device) +model.to(device) + +generated_ids = model.generate( + model_inputs, # The input to the model + max_new_tokens=128, # Limiting the maximum number of new tokens generated + do_sample=True, # Enabling sampling to introduce randomness in the generation + temperature=0.1, # Setting temperature to control the randomness, lower values make it more deterministic + top_p=0.95, # Using nucleus sampling with top-p filtering for more coherent generation + eos_token_id=tokenizer.eos_token_id # Specifying the token that indicates the end of a sequence +) + +decoded_output = tokenizer.decode(generated_ids[0], skip_special_tokens=True) +trimmed_output = decoded_output.strip() +print(trimmed_output) +``` \ No newline at end of file