初始化项目,由ModelHub XC社区提供模型

Model: cloudyu/mistral_28B_instruct_v0.1
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-04-10 21:14:03 +08:00
commit afc17bc533
21 changed files with 92500 additions and 0 deletions

35
.gitattributes vendored Normal file
View File

@@ -0,0 +1,35 @@
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text

28
README.md Normal file
View File

@@ -0,0 +1,28 @@
---
license: cc-by-4.0
---
```
This is a 128-layer model based on the Mistral architecture,
fine-tuned (SFT) on the vicgalle/alpaca-gpt4 dataset.
The prompt template is "{instruction} {inputs} \n {output}"
```
Example output:
```
<s> write a story about new yrok city.
Once upon a time, in the heart of the United States, there was a city known as New York City. It was a bustling metropolis, teeming with people from all walks of life. The streets were alive with energy and excitement, as people went about their daily routines, working hard to make ends meet.
The city was a melting pot of cultures, where people from all over the world had come to start anew. They brought with them their traditions, their customs, and their dreams, creating a unique tapestry that made up the very essence of New York City.
One day, as the sun set over the skyscrapers, a young woman named Maya stepped off the subway, her eyes wide with wonder. She had just moved to the city from a small town in the midwest, and she couldn't believe her luck at having landed a job as a journalist for one of the biggest news organizations in the city.
As she made her way through the crowded streets, she took in everything around her - the sounds of horns honking, the smells of street food, the sight of people from all races and ethnicities living side by side. It was a world unlike anything she had ever experienced before, and it both excited and scared her.
Maya soon found herself immersed in the fast-paced world of journalism, reporting on everything from local events to national news. She worked long hours, but she loved every moment of it. She had finally found her place in the world, and she knew that this was only the beginning of her journey.
Over the next few years, Maya continued to explore the city, uncovering its secrets and sharing its stories with the world. She met people from all walks of life, each one leaving an indelible mark on her heart.
And even as the city changed and grew, Maya remained forever enchanted by its magic. For she had discovered something truly special about New York City: no matter how big or bright the world became, it would always be her home.</s>
```

26
config.json Normal file
View File

@@ -0,0 +1,26 @@
{
"_name_or_path": "./mistral_28B",
"architectures": [
"MistralForCausalLM"
],
"attention_dropout": 0.0,
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 4096,
"initializer_range": 0.02,
"intermediate_size": 14336,
"max_position_embeddings": 32768,
"model_type": "mistral",
"num_attention_heads": 32,
"num_hidden_layers": 128,
"num_key_value_heads": 8,
"rms_norm_eps": 1e-05,
"rope_theta": 1000000.0,
"sliding_window": null,
"tie_word_embeddings": false,
"torch_dtype": "bfloat16",
"transformers_version": "4.38.2",
"use_cache": true,
"vocab_size": 32000
}

6
generation_config.json Normal file
View File

@@ -0,0 +1,6 @@
{
"_from_model_config": true,
"bos_token_id": 1,
"eos_token_id": 2,
"transformers_version": "4.38.2"
}

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:599258c85199df90f982d797b0e3f8f67cfdccac129331fe8f665ab7d10d4c06
size 4943162336

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:292af297680303681fd4eeb78d84e607bfa2205215e5f58ef22e717d91628ab4
size 4999819336

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:1ca288cf374ec1f73f897b3c834edf09b6500df614d0fd7da9a164841bec811b
size 4915916184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e6acedac9365468a8d035e7fe91f513ffba16a839e59e73577d010d8550fb228
size 4915916176

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:497b0d6d4635e9db2f17f3d833e6825026e694632a14191b630f380e073055a0
size 4999819336

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:f7b963b5bc6121b13330ec925ff9f4ba188238f4a309cfc808d8d5e62e242493
size 4915916184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a20230934896ab092432e26c6cb244c5acfaf2ab2429dde59fb64797f7773f86
size 4915916176

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c15585bd3bd5dc52dd82f429bfcea36e17245feaa42ea525b8863d3517371051
size 4999819336

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d398e0af3d4a08c2b7aa9c43af8cfdb9aecef0ea34ce94e683ef5819ccd26ea1
size 4915916184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:939e7aa5bdbd107cfde42bfac1b27d4c8094682f0c8723e693fd4caa93789ffe
size 4915916280

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:30d8939146144ccc84bcb172b3140835e7b8ccdf9295c1604144483c88c0e1b9
size 4999819448

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5bacf84a25873f6a12934a13e31f51a206cb3969c0b203f2b3953502ee61dd97
size 1923166072

1162
model.safetensors.index.json Normal file

File diff suppressed because it is too large Load Diff

30
special_tokens_map.json Normal file
View File

@@ -0,0 +1,30 @@
{
"bos_token": {
"content": "<s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
},
"eos_token": {
"content": "</s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
},
"pad_token": {
"content": "</s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
},
"unk_token": {
"content": "<unk>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false
}
}

91127
tokenizer.json Normal file

File diff suppressed because it is too large Load Diff

BIN
tokenizer.model (Stored with Git LFS) Normal file

Binary file not shown.

47
tokenizer_config.json Normal file
View File

@@ -0,0 +1,47 @@
{
"add_bos_token": true,
"add_eos_token": false,
"added_tokens_decoder": {
"0": {
"content": "<unk>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"1": {
"content": "<s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2": {
"content": "</s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
}
},
"additional_special_tokens": [],
"bos_token": "<s>",
"chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
"clean_up_tokenization_spaces": false,
"eos_token": "</s>",
"legacy": true,
"max_length": 4096,
"model_max_length": 1000000000000000019884624838656,
"pad_token": "</s>",
"sp_model_kwargs": {},
"spaces_between_special_tokens": false,
"stride": 0,
"tokenizer_class": "LlamaTokenizer",
"truncation_side": "right",
"truncation_strategy": "longest_first",
"unk_token": "<unk>",
"use_default_system_prompt": false
}