初始化项目,由ModelHub XC社区提供模型
Model: gabriellarson/Mamba-Codestral-7B-v0.1-GGUF Source: Original Platform
This commit is contained in:
61
.gitattributes
vendored
Normal file
61
.gitattributes
vendored
Normal file
@@ -0,0 +1,61 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Mamba-Codestral-7B-v0.1-F16.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
3
Mamba-Codestral-7B-v0.1-F16.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-F16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a4c5799201ea64de1bc34e8caf200d6d71c06e70a6fa5ac2e98579c6005f631d
|
||||
size 14579764032
|
||||
3
Mamba-Codestral-7B-v0.1-IQ1_M.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ1_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ca658aee1c0c43f9b5654b65a9c6c4987f84b19069661c38809706b313cde2a1
|
||||
size 1687522368
|
||||
3
Mamba-Codestral-7B-v0.1-IQ1_S.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ1_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:dd0d6bd5ba4f5da0f99bc32d921b7d5990ec2863fe146bd23ea81306eabbfa07
|
||||
size 1523158080
|
||||
3
Mamba-Codestral-7B-v0.1-IQ2_M.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ2_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c645d4ce48eef66fb753deeb035087660de8901b1af46538d6aaf0255adfa4ab
|
||||
size 2413399104
|
||||
3
Mamba-Codestral-7B-v0.1-IQ2_S.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ2_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:2a46490d176dde38af7949d70703ac53cfea11df6cd2c3bda1ab275ca316bdcc
|
||||
size 2194246720
|
||||
3
Mamba-Codestral-7B-v0.1-IQ2_XS.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ2_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1e057b146bb168c9b0920f5f74724964b47500165d01cd381e7102f371c03cbd
|
||||
size 2180615232
|
||||
3
Mamba-Codestral-7B-v0.1-IQ2_XXS.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ2_XXS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1669d2b560b292bcd67d56bc60f1e17e040f663a1635afc3b0fbc0e197f966cc
|
||||
size 1961462848
|
||||
3
Mamba-Codestral-7B-v0.1-IQ3_M.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ3_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:0f9f2e0aab6bf07a1e1fb8fe02748275b013507eeb71a8489643169c8c20ac43
|
||||
size 3198258240
|
||||
3
Mamba-Codestral-7B-v0.1-IQ3_XXS.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ3_XXS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:3293b962067709847c7e9079083a79587ad0de5bb18c6a44e65bdfd0d7533759
|
||||
size 2851703872
|
||||
3
Mamba-Codestral-7B-v0.1-IQ4_NL.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ4_NL.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:3a4147b0d71280a480003f1ffc0d966195b3d6df26901ff24590d1c1e86dcd69
|
||||
size 4147481664
|
||||
3
Mamba-Codestral-7B-v0.1-IQ4_XS.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-IQ4_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:aaa724a9a3e86c69c150e86d4b02619546259ac94c74a6e6b8a12e0d7d2c8e93
|
||||
size 3924134976
|
||||
3
Mamba-Codestral-7B-v0.1-Q2_K.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:4a91f568957c1fc33c2311f9bfa235e02389229e67a3adc61cb7058ae8edd927
|
||||
size 2472381504
|
||||
3
Mamba-Codestral-7B-v0.1-Q3_K_M.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:564921706cb0f3903b2585365eb92042a50a3a030b3d0c0a7975482761a895f8
|
||||
size 3198258240
|
||||
3
Mamba-Codestral-7B-v0.1-Q4_0.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-Q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:611d2428116f248ea0715f4a4f9a6e2ba9d8007f69bcc9ae751d2ee5c260c146
|
||||
size 4147481664
|
||||
3
Mamba-Codestral-7B-v0.1-Q5_0.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-Q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:970c01b43b97a7f32003a81d8ba6cc310324ea0917ee0254a45ab4f824a02be8
|
||||
size 5040868416
|
||||
3
Mamba-Codestral-7B-v0.1-Q6_K.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:531521d9952bbd7c783ebce7443dda7b903a5f556c09a4e02d6069fe351b9ed7
|
||||
size 5990091840
|
||||
3
Mamba-Codestral-7B-v0.1-Q8_0.gguf
Normal file
3
Mamba-Codestral-7B-v0.1-Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e601d4ccfabfb109ddaf55712d72388a3778fcf03f8ecb613cf0094d5e0795ad
|
||||
size 7753534528
|
||||
66
README.md
Normal file
66
README.md
Normal file
@@ -0,0 +1,66 @@
|
||||
---
|
||||
license: apache-2.0
|
||||
base_model:
|
||||
- mistralai/Mamba-Codestral-7B-v0.1
|
||||
---
|
||||
## GGUF info:
|
||||
The original model didn't include a chat template; I'm using the flag `--chat-template mistral`.
|
||||
|
||||
Will probably re-do the GGUF files here later
|
||||
|
||||
|
||||
Original Readme:
|
||||
# Model Card for Mamba-Codestral-7B-v0.1
|
||||
|
||||
Codestral Mamba is an open code model based on the Mamba2 architecture. It performs on par with state-of-the-art Transformer-based code models. \
|
||||
You can read more in the [official blog post](https://mistral.ai/news/codestral-mamba/).
|
||||
|
||||
|
||||
## Installation
|
||||
|
||||
It is recommended to use `mistralai/Mamba-Codestral-7B-v0.1` with [mistral-inference](https://github.com/mistralai/mistral-inference)
|
||||
|
||||
|
||||
```
|
||||
pip install "mistral_inference>=1" mamba-ssm causal-conv1d
|
||||
```
|
||||
|
||||
or directly with the original [`mamba`](https://github.com/state-spaces/mamba) package:
|
||||
|
||||
```
|
||||
pip install mamba_ssm causal-conv1d
|
||||
```
|
||||
|
||||
## Download
|
||||
|
||||
```py
|
||||
from huggingface_hub import snapshot_download
|
||||
from pathlib import Path
|
||||
mistral_models_path = Path.home().joinpath('mistral_models', 'Mamba-Codestral-7B-v0.1')
|
||||
mistral_models_path.mkdir(parents=True, exist_ok=True)
|
||||
snapshot_download(repo_id="mistralai/Mamba-Codestral-7B-v0.1", allow_patterns=["params.json", "consolidated.safetensors", "tokenizer.model.v3"], local_dir=mistral_models_path)
|
||||
```
|
||||
|
||||
### Chat
|
||||
|
||||
After installing `mistral_inference`, a `mistral-chat` CLI command should be available in your environment.
|
||||
|
||||
```
|
||||
mistral-chat $HOME/mistral_models/Mamba-Codestral-7B-v0.1 --instruct --max_tokens 256
|
||||
```
|
||||
|
||||
## Evaluation
|
||||
We evaluate Codestral Mamba, Codestral and open-weight models of similar size on industry-standard benchmarks.
|
||||
| Benchmarks | HumanEval | MBPP | Spider | CruxE | HumanEval C++ | HumanEval Java | HumanEval JS | HumanEval Bash |
|
||||
| :---: | :---: | :---: | :---: | :---: | :---: | :---: | :---: | :---: |
|
||||
| CodeGemma 1.1 7B | 61.0% | 67.7% | 46.3% | 50.4% | 49.1% | 41.8% | 52.2% | 9.4% |
|
||||
| CodeLlama 7B | 31.1% | 48.2% | 29.3% | 50.1% | 31.7% | 29.7% | 31.7% | 11.4% |
|
||||
| DeepSeek v1.5 7B | 65.9% | **70.8%** | **61.2%** | 55.5% | 59.0% | **62.7%** | 60.9% | **33.5%** |
|
||||
| **Codestral Mamba (7B)** | **75.0%** | 68.5% | 58.8% | **57.8%** | **59.8%** | 57.0% | **61.5%** | 31.1% |
|
||||
|
|
||||
| **Codestral (22B)** | **81.1%** | **78.2%** | **63.5%** | 51.3% | **65.2%** | **63.3%** | - | **42.4%** |
|
||||
| CodeLlama 34B | 43.3% | 75.1% | 50.8% | 55.2% | 51.6% | 57.0% | 59.0% | 29.7% |
|
||||
|
||||
## The Mistral AI Team
|
||||
|
||||
Albert Jiang, Alexandre Sablayrolles, Alexis Tacnet, Alok Kothari, Antoine Roux, Arthur Mensch, Audrey Herblin-Stoop, Augustin Garreau, Austin Birky, Bam4d, Baptiste Bout, Baudouin de Monicault, Blanche Savary, Carole Rambaud, Caroline Feldman, Devendra Singh Chaplot, Diego de las Casas, Eleonore Arcelin, Emma Bou Hanna, Etienne Metzger, Gaspard Blanchet, Gianna Lengyel, Guillaume Bour, Guillaume Lample, Harizo Rajaona, Henri Roussez, Hichem Sattouf, Ian Mack, Jean-Malo Delignon, Jessica Chudnovsky, Justus Murke, Kartik Khandelwal, Lawrence Stewart, Louis Martin, Louis Ternon, Lucile Saulnier, Lélio Renard Lavaud, Margaret Jennings, Marie Pellat, Marie Torelli, Marie-Anne Lachaux, Marjorie Janiewicz, Mickaël Seznec, Nicolas Schuhl, Niklas Muhs, Olivier de Garrigues, Patrick von Platen, Paul Jacob, Pauline Buche, Pavan Kumar Reddy, Perry Savas, Pierre Stock, Romain Sauvestre, Sagar Vaze, Sandeep Subramanian, Saurabh Garg, Sophia Yang, Szymon Antoniak, Teven Le Scao, Thibault Schueller, Thibaut Lavril, Thomas Wang, Théophile Gervet, Timothée Lacroix, Valera Nemychnikova, Wendy Shang, William El Sayed, William Marshall
|
||||
Reference in New Issue
Block a user