commit 83b7339b4e00c454b078a46741de35efeec3b98c Author: ModelHub XC Date: Tue Apr 21 17:13:38 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: cortexso/deepseek-r1-distill-qwen-1.5b Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..6bb177a --- /dev/null +++ b/.gitattributes @@ -0,0 +1,45 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q2_k.gguf filter=lfs diff=lfs merge=lfs -text 
+deepseek-r1-distill-qwen-1.5b-q3_k_l.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q3_k_s.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q4_k_s.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q5_k_s.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q6_k.gguf filter=lfs diff=lfs merge=lfs -text +deepseek-r1-distill-qwen-1.5b-q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..a79e4fd --- /dev/null +++ b/README.md @@ -0,0 +1,39 @@ +--- +license: mit +pipeline_tag: text-generation +tags: +- cortex.cpp +--- +## Overview + +**DeepSeek** developed and released the [DeepSeek R1 Distill Qwen 1.5B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B) model, a distilled version of the Qwen 1.5B language model. It is fine-tuned for high-performance text generation and optimized for dialogue and information-seeking tasks. This model achieves a balance of efficiency and accuracy while maintaining a smaller footprint compared to the original Qwen 1.5B. + +The model is designed for applications in customer support, conversational AI, and research, prioritizing both helpfulness and safety. + +## Variants + +| No | Variant | Cortex CLI command | +| --- | --- | --- | +| 1 | [Deepseek-r1-distill-qwen-1.5b-1.5b](https://huggingface.co/cortexso/deepseek-r1-distill-qwen-1.5b/tree/1.5b) | `cortex run deepseek-r1-distill-qwen-1.5b:1.5b` | + + +## Use it with Jan (UI) + +1. Install **Jan** using [Quickstart](https://jan.ai/docs/quickstart) +2. Use in Jan model Hub: + ```bash + cortexso/deepseek-r1-distill-qwen-1.5b + ``` +## Use it with Cortex (CLI) + +1. 
Install **Cortex** using [Quickstart](https://cortex.jan.ai/docs/quickstart) +2. Run the model with the command: + ```bash + cortex run deepseek-r1-distill-qwen-1.5b + ``` +## Credits + +- **Author:** DeepSeek +- **Converter:** [Homebrew](https://www.homebrew.ltd/) +- **Original License:** [License](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B#7-license) +- **Papers:** [DeepSeek-R1: Incentivizing Reasoning Capability in LLMs via Reinforcement Learning](https://arxiv.org/html/2501.12948v1) \ No newline at end of file diff --git a/deepseek-r1-distill-qwen-1.5b-q2_k.gguf b/deepseek-r1-distill-qwen-1.5b-q2_k.gguf new file mode 100644 index 0000000..dd73caf --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q2_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0158a03fb9d3d9eb701b02b2a3d6006fbf2c42ef74c91fc01ca44b34e412d0e +size 752879904 diff --git a/deepseek-r1-distill-qwen-1.5b-q3_k_l.gguf b/deepseek-r1-distill-qwen-1.5b-q3_k_l.gguf new file mode 100644 index 0000000..972d530 --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q3_k_l.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65cb42bade66e46ba90bf43a0165883c263de32f0d0a1d67b03c694f3b8bceb5 +size 980439840 diff --git a/deepseek-r1-distill-qwen-1.5b-q3_k_m.gguf b/deepseek-r1-distill-qwen-1.5b-q3_k_m.gguf new file mode 100644 index 0000000..f62d800 --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q3_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9235d49e507ef970d54784f905a3d5892ae3386ae726ad6840c392ae559cca73 +size 924455712 diff --git a/deepseek-r1-distill-qwen-1.5b-q3_k_s.gguf b/deepseek-r1-distill-qwen-1.5b-q3_k_s.gguf new file mode 100644 index 0000000..d807e6a --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q3_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8a514f11865245b4d80f74d8314d31f1c165105ab9e989e87c59d98d4246d4 +size 861221664 diff --git
a/deepseek-r1-distill-qwen-1.5b-q4_k_m.gguf b/deepseek-r1-distill-qwen-1.5b-q4_k_m.gguf new file mode 100644 index 0000000..eefcf93 --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q4_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c47e9cc3399de9403f11a206ed59dcef2f9f8889eff71ed6f5a92a1b84453f1 +size 1117320480 diff --git a/deepseek-r1-distill-qwen-1.5b-q4_k_s.gguf b/deepseek-r1-distill-qwen-1.5b-q4_k_s.gguf new file mode 100644 index 0000000..0f160ac --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q4_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59500a4a0625421cb3cca5d0c09a30e5f50b56130d765bad57b682ad9fdde951 +size 1071584544 diff --git a/deepseek-r1-distill-qwen-1.5b-q5_k_m.gguf b/deepseek-r1-distill-qwen-1.5b-q5_k_m.gguf new file mode 100644 index 0000000..2fcde7c --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q5_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6faad9e18a4d5d59852bf58b81e3a7a704b6f0712786ce683d473751474ae967 +size 1285494048 diff --git a/deepseek-r1-distill-qwen-1.5b-q5_k_s.gguf b/deepseek-r1-distill-qwen-1.5b-q5_k_s.gguf new file mode 100644 index 0000000..0a54ca3 --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q5_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bfa62baa1a976bdb236a0e1e970f085cc19ec6c374206865f756fb7ce39367f +size 1259173152 diff --git a/deepseek-r1-distill-qwen-1.5b-q6_k.gguf b/deepseek-r1-distill-qwen-1.5b-q6_k.gguf new file mode 100644 index 0000000..e92b10e --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q6_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa21e354d44b210e30100730676e81ed17d7c8f003307a327e4713e764099d7b +size 1464178464 diff --git a/deepseek-r1-distill-qwen-1.5b-q8_0.gguf b/deepseek-r1-distill-qwen-1.5b-q8_0.gguf new file mode 100644 index 0000000..8a48e63 --- /dev/null +++ b/deepseek-r1-distill-qwen-1.5b-q8_0.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:6529f4b51da8765ecf67d2b94c3749e5f78ea86ae720e6504c0e7b50f384cb7d +size 1894531872 diff --git a/metadata.yml b/metadata.yml new file mode 100644 index 0000000..adf3c81 --- /dev/null +++ b/metadata.yml @@ -0,0 +1,4 @@ +version: 1 +name: deepseek-r1-distill-qwen-1.5b +default: 1.5b +author: "DeepSeek-AI" diff --git a/model.yml b/model.yml new file mode 100644 index 0000000..b3dd18b --- /dev/null +++ b/model.yml @@ -0,0 +1,49 @@ +# BEGIN GENERAL GGUF METADATA +id: deepseek-r1-distill-qwen-1.5b +model: deepseek-r1-distill-qwen-1.5b +name: deepseek-r1-distill-qwen-1.5b +version: 1 +# END GENERAL GGUF METADATA + +# BEGIN INFERENCE PARAMETERS +# BEGIN REQUIRED +stop: +- <|im_end|> +- "<\uFF5Cend\u2581of\u2581sentence\uFF5C>" +# END REQUIRED + +# BEGIN OPTIONAL +stream: true +top_p: 0.9 +temperature: 0.7 +frequency_penalty: 0 +presence_penalty: 0 +max_tokens: 4096 +seed: -1 +dynatemp_range: 0 +dynatemp_exponent: 1 +top_k: 40 +min_p: 0.05 +tfs_z: 1 +typ_p: 1 +repeat_last_n: 64 +repeat_penalty: 1 +mirostat: false +mirostat_tau: 5 +mirostat_eta: 0.100000001 +penalize_nl: false +ignore_eos: false +n_probs: 0 +min_keep: 0 +# END OPTIONAL +# END INFERENCE PARAMETERS + +# BEGIN MODEL LOAD PARAMETERS +# BEGIN REQUIRED +engine: llama-cpp +prompt_template: "|start_of_text|>{system_message}<\uFF5CUser\uFF5C>{prompt}<\uFF5C\ + Assistant\uFF5C>" +ctx_len: 4096 +ngl: 29 +# END REQUIRED +# END MODEL LOAD PARAMETERS