初始化项目,由ModelHub XC社区提供模型

Model: duyntnet/Mistral-Nemo-Instruct-2407-imatrix-GGUF
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-06-17 16:17:17 +08:00
commit dadac179e6
29 changed files with 313 additions and 0 deletions

62
.gitattributes vendored Normal file
View File

@@ -0,0 +1,62 @@
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
Mistral-Nemo-Instruct-2407-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:dbebafc8a9938b65d66b917ecbb5c2b2313e6a2fe243b6bdfa11e1fd1808acc7
size 3221625184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e1798defc43b0188add2bbc0d43d19dd3cdbec6c14d6c9c1c545fdf4928a4413
size 2999212384

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7d77d641be761cc1c9db8a8d0f76fd00f6b1f4d095ad6084fac24c78085b5998
size 4435024224

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ab2208cf6520b1ad4bae2b2ff07c5d671aefad13b141eb799a702e27cb2f39a7
size 4138473824

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:016a6ac54964fdc93e518861c38b3303633c5558ee22bb575ed00d2176c38a64
size 3915077984

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:61ab470a776083b9e999a795d9e215ff12875b1422eef8e2f04c6b5b66e84efd
size 3592313184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:25d3c2aa841e71d20c59a6c6f512bda251d73f28e83e21761c25102bf5bb80b5
size 5722233184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:0338fee950156b123ec148fe590a5eb89f876deb27f1fa0c6391427244513db0
size 5562079584

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a83500275712097b0994d3e2d2556331efb672e562c5414c8af7ff3aaf27f1d4
size 5306489184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a275677290c9d3f6325f5d4753707a21701f1bc94851945b829d82924fb45274
size 4945385824

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2db15f56e3cc628b0665e45fd6e8a1c8adf1c1ceea8f28b23cdf3099aae631be
size 7097915744

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d59e12be67e24620842998e26a7236794d2c9fa72f9853481d34fc776210930f
size 6742710624

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:70844873ed499440da257cd4537ebf70a62e26dc3bfcf058be93023310af2fca
size 4791048544

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1e566bdd39a341dd8f0fca5f0eae04a5225572968fb444bb4a03f7197d2bc691
size 4493678944

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d9e513f880e6c5d598e93154290e7d4017646dddf95d899a0c2c244ac8e26f22
size 6561503584

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ecce7c3eaf2b0334bf4b29cdfb5bbbc09b92953e75b13b184cb46aa6489624ef
size 6083090784

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:cef895c37a7a01c797148b2ff2269da8b82b0d9d82030cdf3a9398739830a991
size 5534226784

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5dbb82cf3b4fd7d8f38d811cbbcb448a3a52148c60976e5006447b51670aa222
size 7094638944

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:bd94c5307b3ca02a734ef8cf323aa9e1964a81ad422be2bb25b332825f27aaea
size 7795218784

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6e68a8fd463e0917de33321e817a9e1a0d2b5779db24841301efdc4406e580f2
size 7477205344

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6b816d8b12e96d4b9a5f6a1f7f009ee7e835954d147a72f321151c480de694e3
size 7120197984

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3e3bd69402e3f02644b8bc6e9b969ddf45e07c22fae323bc652dbb99d9f9bff9
size 8541673824

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b5cb487c3ff7a043dddf10e9f5ca71b45514f527539ee41a22739dacb4ef9436
size 9242253664

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:41d0712c80195dd58f1810a68915ab243a74c41393205c19f82abd18ddf8bd32
size 8727632224

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:858800c1f7fd112822c02e34cd271e74ce5dd1ab052e856c4e30786a3e38f4f3
size 8518736224

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e4e82039e134919e2e7cce55562a46e277fa5aa63d041e1bcc6d47d4f31a1001
size 10056210784

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:269a2828d16358a449ea0ccb39750cc9c4a2baa60762d39ae1c40fdfb4fced56
size 13022370144

170
README.md Normal file
View File

@@ -0,0 +1,170 @@
---
license: other
language:
- en
pipeline_tag: text-generation
inference: false
tags:
- transformers
- gguf
- imatrix
- Mistral-Nemo-Instruct-2407
---
Quantizations of https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407
### Inference Clients/UIs
* [llama.cpp](https://github.com/ggerganov/llama.cpp)
* [JanAI](https://github.com/janhq/jan)
* [KoboldCPP](https://github.com/LostRuins/koboldcpp)
* [text-generation-webui](https://github.com/oobabooga/text-generation-webui)
* [ollama](https://github.com/ollama/ollama)
* [GPT4All](https://github.com/nomic-ai/gpt4all)
---
# From original readme
## Usage
The model can be used with three different frameworks:
- [`mistral_inference`](https://github.com/mistralai/mistral-inference): See [here](https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407#mistral-inference)
- [`transformers`](https://github.com/huggingface/transformers): See [here](#transformers)
- [`NeMo`](https://github.com/NVIDIA/NeMo): See [nvidia/Mistral-NeMo-12B-Instruct](https://huggingface.co/nvidia/Mistral-NeMo-12B-Instruct)
### Mistral Inference
#### Install
It is recommended to use `mistralai/Mistral-Nemo-Instruct-2407` with [mistral-inference](https://github.com/mistralai/mistral-inference). For HF transformers code snippets, please keep scrolling.
```
pip install mistral_inference
```
#### Download
```py
from huggingface_hub import snapshot_download
from pathlib import Path
mistral_models_path = Path.home().joinpath('mistral_models', 'Nemo-Instruct')
mistral_models_path.mkdir(parents=True, exist_ok=True)
snapshot_download(repo_id="mistralai/Mistral-Nemo-Instruct-2407", allow_patterns=["params.json", "consolidated.safetensors", "tekken.json"], local_dir=mistral_models_path)
```
#### Chat
After installing `mistral_inference`, a `mistral-chat` CLI command should be available in your environment. You can chat with the model using:
```
mistral-chat $HOME/mistral_models/Nemo-Instruct --instruct --max_tokens 256 --temperature 0.35
```
*E.g.* Try out something like:
```
How expensive would it be to ask a window cleaner to clean all windows in Paris. Make a reasonable guess in US Dollar.
```
#### Instruct following
```py
from mistral_inference.transformer import Transformer
from mistral_inference.generate import generate
from mistral_common.tokens.tokenizers.mistral import MistralTokenizer
from mistral_common.protocol.instruct.messages import UserMessage
from mistral_common.protocol.instruct.request import ChatCompletionRequest
tokenizer = MistralTokenizer.from_file(f"{mistral_models_path}/tekken.json")
model = Transformer.from_folder(mistral_models_path)
prompt = "How expensive would it be to ask a window cleaner to clean all windows in Paris. Make a reasonable guess in US Dollar."
completion_request = ChatCompletionRequest(messages=[UserMessage(content=prompt)])
tokens = tokenizer.encode_chat_completion(completion_request).tokens
out_tokens, _ = generate([tokens], model, max_tokens=64, temperature=0.35, eos_id=tokenizer.instruct_tokenizer.tokenizer.eos_id)
result = tokenizer.decode(out_tokens[0])
print(result)
```
#### Function calling
```py
from mistral_common.protocol.instruct.tool_calls import Function, Tool
from mistral_inference.transformer import Transformer
from mistral_inference.generate import generate
from mistral_common.tokens.tokenizers.mistral import MistralTokenizer
from mistral_common.protocol.instruct.messages import UserMessage
from mistral_common.protocol.instruct.request import ChatCompletionRequest
tokenizer = MistralTokenizer.from_file(f"{mistral_models_path}/tekken.json")
model = Transformer.from_folder(mistral_models_path)
completion_request = ChatCompletionRequest(
tools=[
Tool(
function=Function(
name="get_current_weather",
description="Get the current weather",
parameters={
"type": "object",
"properties": {
"location": {
"type": "string",
"description": "The city and state, e.g. San Francisco, CA",
},
"format": {
"type": "string",
"enum": ["celsius", "fahrenheit"],
"description": "The temperature unit to use. Infer this from the users location.",
},
},
"required": ["location", "format"],
},
)
)
],
messages=[
UserMessage(content="What's the weather like today in Paris?"),
],
)
tokens = tokenizer.encode_chat_completion(completion_request).tokens
out_tokens, _ = generate([tokens], model, max_tokens=256, temperature=0.35, eos_id=tokenizer.instruct_tokenizer.tokenizer.eos_id)
result = tokenizer.decode(out_tokens[0])
print(result)
```
### Transformers
> [!IMPORTANT]
> NOTE: Until a new release has been made, you need to install transformers from source:
> ```sh
> pip install git+https://github.com/huggingface/transformers.git
> ```
If you want to use Hugging Face `transformers` to generate text, you can do something like this.
```py
from transformers import pipeline
messages = [
{"role": "system", "content": "You are a pirate chatbot who always responds in pirate speak!"},
{"role": "user", "content": "Who are you?"},
]
chatbot = pipeline("text-generation", model="mistralai/Mistral-Nemo-Instruct-2407")
chatbot(messages)
```
> [!TIP]
> Unlike previous Mistral models, Mistral Nemo requires lower temperatures. We recommend using a temperature of 0.3.