初始化项目，由ModelHub XC社区提供模型

Model: Shinzmann/naija-petro-GGUF Source: Original Platform
2026-06-11 05:14:16 +08:00
commit 0da4f955c7
8 changed files with 258 additions and 0 deletions
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,39 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+Qwen3-32B.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen3-32B.BF16-00002-of-00002.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen3-32B.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Qwen3-32B.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
--- a/59
+++ b/59
@@ -0,0 +1,59 @@
+
+FROM Qwen3-32B.Q8_0.gguf
+TEMPLATE """{{- if .Messages }}
+{{- if or .System .Tools }}<|im_start|>system
+{{- if .System }}
+{{ .System }}
+{{- end }}
+{{- if .Tools }}
+
+# Tools
+
+You may call one or more functions to assist with the user query.
+
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>
+{{- range .Tools }}
+{"type": "function", "function": {{ .Function }}}
+{{- end }}
+</tools>
+
+For each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:
+<tool_call>
+{"name": <function-name>, "arguments": <args-json-object>}
+</tool_call>
+{{- end }}<|im_end|>
+{{ end }}
+{{- range $i, $_ := .Messages }}
+{{- $last := eq (len (slice $.Messages $i)) 1 -}}
+{{- if eq .Role "user" }}<|im_start|>user
+{{ .Content }}<|im_end|>
+{{ else if eq .Role "assistant" }}<|im_start|>assistant
+{{ if .Content }}{{ .Content }}
+{{- else if .ToolCalls }}<tool_call>
+{{ range .ToolCalls }}{"name": "{{ .Function.Name }}", "arguments": {{ .Function.Arguments }}}
+{{ end }}</tool_call>
+{{- end }}{{ if not $last }}<|im_end|>
+{{ end }}
+{{- else if eq .Role "tool" }}<|im_start|>user
+<tool_response>
+{{ .Content }}
+</tool_response><|im_end|>
+{{ end }}
+{{- if and (ne .Role "assistant") $last }}<|im_start|>assistant
+{{ end }}
+{{- end }}
+{{- else }}
+{{- if .System }}<|im_start|>system
+{{ .System }}<|im_end|>
+{{ end }}{{ if .Prompt }}<|im_start|>user
+{{ .Prompt }}<|im_end|>
+{{ end }}<|im_start|>assistant
+{{ end }}{{ .Response }}{{ if .Response }}<|im_end|>{{ end }}"""
+PARAMETER stop "<|im_end|>"
+PARAMETER stop "<|im_start|>"
+PARAMETER temperature 0.6
+PARAMETER min_p 0.0
+PARAMETER top_k 20
+PARAMETER top_p 0.95
+PARAMETER repeat_penalty 1
--- a/Qwen3-32B.BF16-00002-of-00002.gguf
+++ b/Qwen3-32B.BF16-00002-of-00002.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f74ef6d23b3cf787ba60d21c8912745e03e0630ddd0afb305d01044fe16804e3
+size 15659811424
--- a/Qwen3-32B.Q4_K_M.gguf
+++ b/Qwen3-32B.Q4_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a49e4b593eda8bbc997c00b4b352722a05e593b1505c84c0475cac67d5f81523
+size 19762149568
--- a/Qwen3-32B.Q5_K_M.gguf
+++ b/Qwen3-32B.Q5_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef5a0f984cdbb5a5e0b2ca18b5beec5785033f21682146d427a467442ff4f55d
+size 23214831808
--- a/Qwen3-32B.Q8_0.gguf
+++ b/Qwen3-32B.Q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b6c8c64b438ff2022e81a3eeadfa1f524d97c2e95ea6370ab3afa1a8331f538e
+size 34817719488
--- a/README.md
+++ b/README.md
@@ -0,0 +1,48 @@
+---
+license: apache-2.0
+language:
+- en
+base_model: Shinzmann/naija-petro
+pipeline_tag: text-generation
+tags:
+- petroleum-engineering
+- oil-and-gas
+- nigeria
+- qwen3
+- gguf
+- llama-cpp
+- ollama
+- quantized
+---
+
+# Naija-Petro (32B) — GGUF
+
+GGUF quantizations of [`Shinzmann/naija-petro`](https://huggingface.co/Shinzmann/naija-petro) (the 32B variant) for inference with [llama.cpp](https://github.com/ggml-org/llama.cpp), [Ollama](https://ollama.com), LM Studio, and compatible runtimes.
+
+See the full [model card](https://huggingface.co/Shinzmann/naija-petro) for training details, intended use, and limitations. For a lighter footprint, consider the [8B GGUF](https://huggingface.co/Shinzmann/naija-petro-8b-GGUF). For Nigeria-specific accuracy, use these weights with the [Naija-Petro RAG system](https://github.com/Mystique1337/naija-petro).
+
+## Available quantizations
+
+| File suffix | Method | Notes |
+|---|---|---|
+| `Q4_K_M` | 4-bit (k-quant, medium) | Smallest; recommended default for 32B on limited RAM/VRAM |
+| `Q5_K_M` | 5-bit (k-quant, medium) | Higher quality, larger |
+| `Q8_0`   | 8-bit | Near-lossless; largest and slowest |
+
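+> 32B GGUF files are large: approximately 19.8 GB (`Q4_K_M`), 23.2 GB (`Q5_K_M`), and 34.8 GB (`Q8_0`) on disk. Q4_K_M is the practical choice for most machines; make sure you have enough RAM/VRAM to load the chosen quant, plus at least that much free disk space to download it.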
+
+## Usage
+
+**Ollama**
+```bash
+ollama run hf.co/Shinzmann/naija-petro-GGUF:Q4_K_M
+```
+
+**llama.cpp**
+```bash
+./llama-cli -hf Shinzmann/naija-petro-GGUF:Q4_K_M \
+  -p "What are the screening criteria for CO2 EOR?" -c 4096
+```
+
+## License
+Apache-2.0 (inherited from Qwen3-32B). Validate outputs with qualified engineers before operational use.
--- a/config.json
+++ b/config.json
@@ -0,0 +1,100 @@
+{
+    "architectures": [
+        "Qwen3ForCausalLM"
+    ],
+    "attention_bias": false,
+    "attention_dropout": 0.0,
+    "bos_token_id": null,
+    "torch_dtype": "bfloat16",
+    "eos_token_id": 151645,
+    "head_dim": 128,
+    "hidden_act": "silu",
+    "hidden_size": 5120,
+    "initializer_range": 0.02,
+    "intermediate_size": 25600,
+    "layer_types": [
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention",
+        "full_attention"
+    ],
+    "max_position_embeddings": 40960,
+    "max_window_layers": 64,
+    "model_type": "qwen3",
+    "num_attention_heads": 64,
+    "num_hidden_layers": 64,
+    "num_key_value_heads": 8,
+    "pad_token_id": 151669,
+    "rms_norm_eps": 1e-06,
+    "rope_parameters": {
+        "rope_theta": 1000000,
+        "rope_type": "default"
+    },
+    "sliding_window": null,
+    "tie_word_embeddings": false,
+    "unsloth_fixed": true,
+    "unsloth_version": "2026.3.7",
+    "use_cache": false,
+    "use_sliding_window": false,
+    "vocab_size": 151936
+}