初始化项目,由ModelHub XC社区提供模型
Model: gaianet/Llama-3_1-Nemotron-51B-Instruct-GGUF Source: Original Platform
This commit is contained in:
52
.gitattributes
vendored
Normal file
52
.gitattributes
vendored
Normal file
@@ -0,0 +1,52 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q8_0-00001-of-00002.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-Q8_0-00002-of-00002.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-f16-00001-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-f16-00002-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-f16-00003-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-3_1-Nemotron-51B-Instruct-f16-00004-of-00004.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q2_K.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1f1d6ad4df6fa589194203235d19bb31315cd73beb3ed2dffb02a6eb1d404ac9
|
||||
size 19418642464
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q3_K_L.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:cbe29ae0b25627ac8631a34ca6f11d572ae4a0bd6c1f8650f960a0faf7fe69b0
|
||||
size 27349751840
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q3_K_M.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e8595b234baa5fc3dc14db611793cedcdb3ab73bcc421bacc46a15a4ba6bb57b
|
||||
size 25182345248
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q3_K_S.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ef2b0a9330eafc8fb6cde9285e7cd1c9b9a081e4ecd68f02fcb8e3b1459eaa68
|
||||
size 22652393504
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q4_0.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:624711249056e4dc79bda0090015f3ed0a44fe7ca35a2a91579efe90b92908aa
|
||||
size 29252368416
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q4_K_M.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:db50b770b4cc7918f1a25f204609c4c478e41c2f10499ec900259cb052948c11
|
||||
size 31037306912
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q4_K_S.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:041d5660e8f40b1fe28c65c522e92814cb855426187aae81ca9359ca10e46df5
|
||||
size 29484496928
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q5_0.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:7f6baa9e8ba28870f76093655dcf04b9a4439a8edf4b51efc4725c44684d1c24
|
||||
size 35558504480
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q5_K_M.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:9e19d5f2172cb51bcb3dd22391cebaf4c7f0210c562200ae671d8640e115de36
|
||||
size 36465391648
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q5_K_S.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:906aefa4926bec89d3aff281db866bb02e4ed79792566b28cc3d6a8bebcb5c79
|
||||
size 35558504480
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q6_K.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8d66d3daee89d9e2596841f3589b3268ef060aef1513070a5ce390ce00adf12f
|
||||
size 42258774048
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q8_0-00001-of-00002.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q8_0-00001-of-00002.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:4ed2a1ad93790fcfe630e5755f5ce18d9fd7a04808e36343f3b000bde61ffa55
|
||||
size 29826134528
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-Q8_0-00002-of-00002.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-Q8_0-00002-of-00002.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:f20fc51b96935e0e17daee28f9694ef85cc7f66faabf3ea0d2a5f126e958fbf9
|
||||
size 24905238240
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-f16-00001-of-00004.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-f16-00001-of-00004.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c29966a7c3b2172525e4b9b29de9391ac1507476e26ae09486fb0953501c5c47
|
||||
size 29772092192
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-f16-00002-of-00004.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-f16-00002-of-00004.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:67d59882c28b27005f0551e3ece2e49c37a9096022f08b1cb228f8cefc09e75c
|
||||
size 29562578048
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-f16-00003-of-00004.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-f16-00003-of-00004.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:534c2dd1ee26a2fbf3979582b0fdafa9bd01e9d3f0eb7d78a506ab10f5bb0897
|
||||
size 29596988128
|
||||
3
Llama-3_1-Nemotron-51B-Instruct-f16-00004-of-00004.gguf
Normal file
3
Llama-3_1-Nemotron-51B-Instruct-f16-00004-of-00004.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:82558d958d66febc358278b3c96b4479e2c002dd4b7babe49cbf111cc05813f3
|
||||
size 14080741216
|
||||
42
README.md
Normal file
42
README.md
Normal file
@@ -0,0 +1,42 @@
|
||||
---
|
||||
base_model: nvidia/Llama-3_1-Nemotron-51B-Instruct
|
||||
license: other
|
||||
license_name: nvidia-open-model-license
|
||||
license_link: >-
|
||||
https://developer.download.nvidia.com/licenses/nvidia-open-model-license-agreement-june-2024.pdf
|
||||
model_creator: nvidia
|
||||
model_name: Llama-3_1-Nemotron-51B-Instruct
|
||||
quantized_by: Second State Inc.
|
||||
library_name: transformers
|
||||
pipeline_tag: text-generation
|
||||
language:
|
||||
- en
|
||||
tags:
|
||||
- nvidia
|
||||
- llama-3
|
||||
- pytorch
|
||||
---
|
||||
|
||||
# Llama-3_1-Nemotron-51B-Instruct-GGUF
|
||||
|
||||
## Original Model
|
||||
|
||||
[nvidia/Llama-3_1-Nemotron-51B-Instruct](https://huggingface.co/nvidia/Llama-3_1-Nemotron-51B-Instruct)
|
||||
|
||||
## Run with GaiaNet
|
||||
|
||||
**Prompt template:**
|
||||
|
||||
prompt template: `llama-3-chat`
|
||||
|
||||
**Context size:**
|
||||
|
||||
chat_ctx_size: `8192`
|
||||
|
||||
**Run with GaiaNet:**
|
||||
|
||||
- Quick start: https://docs.gaianet.ai/node-guide/quick-start
|
||||
|
||||
- Customize your node: https://docs.gaianet.ai/node-guide/customize
|
||||
|
||||
*Quantized with llama.cpp b4381*
|
||||
1004
config.json
Normal file
1004
config.json
Normal file
File diff suppressed because it is too large
Load Diff
Reference in New Issue
Block a user