初始化项目,由ModelHub XC社区提供模型
Model: cloudyu/mistral_28B_instruct_v0.2 Source: Original Platform
This commit is contained in:
35
.gitattributes
vendored
Normal file
35
.gitattributes
vendored
Normal file
@@ -0,0 +1,35 @@
|
|||||||
|
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.model filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||||
|
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||||
23
README.md
Normal file
23
README.md
Normal file
@@ -0,0 +1,23 @@
|
|||||||
|
---
|
||||||
|
license: cc-by-4.0
|
||||||
|
---
|
||||||
|
```
|
||||||
|
This is a 128-layer model based on the Mistral architecture.
|
||||||
|
Trained with DPO on the Intel/orca_dpo_pairs dataset.
|
||||||
|
template is "{instruction} {inputs} \n {output}"
|
||||||
|
```
|
||||||
|
|
||||||
|
Example output:
|
||||||
|
|
||||||
|
```
|
||||||
|
<s> write a story about yosemite.
|
||||||
|
Once upon a time, in the heart of California's Sierra Nevada Mountains, there was a land known as Yosemite National Park. This magical place was home to some of nature's most breathtaking wonders, from its towering redwood trees to its crystal clear streams and icy alpine lakes.
|
||||||
|
|
||||||
|
In this enchanted land lived a family of animals that called Yosemite their home. There were grizzly bears roaming free through the forests, while coyotes howled at the moon on clear night. A family of mules had made their home among the cliffs, while a group of rabbits danced and frolicked in the meadow.
|
||||||
|
|
||||||
|
One day, a young doe named Bella set out on an adventure to explore the wondrous landscapes of Yosemite. She followed the path of the river upstream, her eyes fixed on the top of the mountain where she could see the first glints of snow. As she climbed higher and higher, she met other animals on her journey - a family of foxes, a family of beavers, even a family of owls! They all shared stories of their adventures in Yosemite, and Bella listened with amazement.
|
||||||
|
|
||||||
|
Eventually, Bella reached the top of the mountain, where she was greeted by the most stunning view she had ever seen. Below her, the valley spread out like a green sea, filled with every kind of plant life and animal species. The sun set over the horizon, painting the sky in shades of pink and orange.
|
||||||
|
|
||||||
|
Bella knew that she would never forget this moment, or the magic of Yosemite. She took one last look before starting her journey back down the mountain, her heart filled with gratitude for the wonders of nature that surrounded her. From then on, Bella explored Yosemite every day, always finding something new and amazing around every corner. And so it continued, year after year, as Yosemite remained a land of magic and wonder, a paradise for all who dared to explore its secrets.</s>
|
||||||
|
```
|
||||||
26
config.json
Normal file
26
config.json
Normal file
@@ -0,0 +1,26 @@
|
|||||||
|
{
|
||||||
|
"_name_or_path": "./28B",
|
||||||
|
"architectures": [
|
||||||
|
"MistralForCausalLM"
|
||||||
|
],
|
||||||
|
"attention_dropout": 0.0,
|
||||||
|
"bos_token_id": 1,
|
||||||
|
"eos_token_id": 2,
|
||||||
|
"hidden_act": "silu",
|
||||||
|
"hidden_size": 4096,
|
||||||
|
"initializer_range": 0.02,
|
||||||
|
"intermediate_size": 14336,
|
||||||
|
"max_position_embeddings": 32768,
|
||||||
|
"model_type": "mistral",
|
||||||
|
"num_attention_heads": 32,
|
||||||
|
"num_hidden_layers": 128,
|
||||||
|
"num_key_value_heads": 8,
|
||||||
|
"rms_norm_eps": 1e-05,
|
||||||
|
"rope_theta": 1000000.0,
|
||||||
|
"sliding_window": null,
|
||||||
|
"tie_word_embeddings": false,
|
||||||
|
"torch_dtype": "bfloat16",
|
||||||
|
"transformers_version": "4.38.2",
|
||||||
|
"use_cache": true,
|
||||||
|
"vocab_size": 32000
|
||||||
|
}
|
||||||
6
generation_config.json
Normal file
6
generation_config.json
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
{
|
||||||
|
"_from_model_config": true,
|
||||||
|
"bos_token_id": 1,
|
||||||
|
"eos_token_id": 2,
|
||||||
|
"transformers_version": "4.38.2"
|
||||||
|
}
|
||||||
3
model-00001-of-00012.safetensors
Normal file
3
model-00001-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:fa97d22b448b8aa3c676ad50b683b11cf62a7185ea9bdcbdd676e6c3a9c9920a
|
||||||
|
size 4943162336
|
||||||
3
model-00002-of-00012.safetensors
Normal file
3
model-00002-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:368d51e65c23b1f988634d9ed9318ff5e3d20b9c8cb352c2534dd510cabdec61
|
||||||
|
size 4999819336
|
||||||
3
model-00003-of-00012.safetensors
Normal file
3
model-00003-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:f48d23f5716270a037134014a47880c10114c93c2cca7ecf8c53804103c630ad
|
||||||
|
size 4915916184
|
||||||
3
model-00004-of-00012.safetensors
Normal file
3
model-00004-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:704a0b00c9d793cb5f3f6c94b5349458207fede86a7dd383b67ecf69b3a8179e
|
||||||
|
size 4915916176
|
||||||
3
model-00005-of-00012.safetensors
Normal file
3
model-00005-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:91f12525f2ad00d94f0ee460756fe6fdfa8d67ef025a9d7bd357d89045176602
|
||||||
|
size 4999819336
|
||||||
3
model-00006-of-00012.safetensors
Normal file
3
model-00006-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:2fe1d8581da6de03d6d4972063f133a8fa0e6bc0290b6ef4da362ab1ad5d121e
|
||||||
|
size 4915916184
|
||||||
3
model-00007-of-00012.safetensors
Normal file
3
model-00007-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:c22e21eb620b5afff5af8d0b7953b92e30eced778b671a6df69a6713f78bf675
|
||||||
|
size 4915916176
|
||||||
3
model-00008-of-00012.safetensors
Normal file
3
model-00008-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:c08a318f27cad7331fdabe3d3a39a49a52021539e772813c733d035bc9276b82
|
||||||
|
size 4999819336
|
||||||
3
model-00009-of-00012.safetensors
Normal file
3
model-00009-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:1f6a2ee613c8a517c1578f7cca646947e502533162dd2932e3b7dc1b3cccbf89
|
||||||
|
size 4915916184
|
||||||
3
model-00010-of-00012.safetensors
Normal file
3
model-00010-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:7ca366ab92987d8bf943145d8872365a45a5ade0e4cd784a8432faafd87d8887
|
||||||
|
size 4915916280
|
||||||
3
model-00011-of-00012.safetensors
Normal file
3
model-00011-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:ece70d167c858ee0432725715b2bfebc4b79104d57ec6fe86df0a88ce956688f
|
||||||
|
size 4999819448
|
||||||
3
model-00012-of-00012.safetensors
Normal file
3
model-00012-of-00012.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:f45663bb1622acf9b340c942206fe4f9077a1fd980d0bca1e69f3c7bf1169b5e
|
||||||
|
size 1923166072
|
||||||
1162
model.safetensors.index.json
Normal file
1162
model.safetensors.index.json
Normal file
File diff suppressed because it is too large
Load Diff
30
special_tokens_map.json
Normal file
30
special_tokens_map.json
Normal file
@@ -0,0 +1,30 @@
|
|||||||
|
{
|
||||||
|
"bos_token": {
|
||||||
|
"content": "<s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false
|
||||||
|
},
|
||||||
|
"eos_token": {
|
||||||
|
"content": "</s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false
|
||||||
|
},
|
||||||
|
"pad_token": {
|
||||||
|
"content": "</s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false
|
||||||
|
},
|
||||||
|
"unk_token": {
|
||||||
|
"content": "<unk>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false
|
||||||
|
}
|
||||||
|
}
|
||||||
91127
tokenizer.json
Normal file
91127
tokenizer.json
Normal file
File diff suppressed because it is too large
Load Diff
BIN
tokenizer.model
(Stored with Git LFS)
Normal file
BIN
tokenizer.model
(Stored with Git LFS)
Normal file
Binary file not shown.
47
tokenizer_config.json
Normal file
47
tokenizer_config.json
Normal file
@@ -0,0 +1,47 @@
|
|||||||
|
{
|
||||||
|
"add_bos_token": true,
|
||||||
|
"add_eos_token": false,
|
||||||
|
"added_tokens_decoder": {
|
||||||
|
"0": {
|
||||||
|
"content": "<unk>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
},
|
||||||
|
"1": {
|
||||||
|
"content": "<s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
},
|
||||||
|
"2": {
|
||||||
|
"content": "</s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additional_special_tokens": [],
|
||||||
|
"bos_token": "<s>",
|
||||||
|
"chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
|
||||||
|
"clean_up_tokenization_spaces": false,
|
||||||
|
"eos_token": "</s>",
|
||||||
|
"legacy": true,
|
||||||
|
"max_length": 4096,
|
||||||
|
"model_max_length": 1000000000000000019884624838656,
|
||||||
|
"pad_token": "</s>",
|
||||||
|
"sp_model_kwargs": {},
|
||||||
|
"spaces_between_special_tokens": false,
|
||||||
|
"stride": 0,
|
||||||
|
"tokenizer_class": "LlamaTokenizer",
|
||||||
|
"truncation_side": "right",
|
||||||
|
"truncation_strategy": "longest_first",
|
||||||
|
"unk_token": "<unk>",
|
||||||
|
"use_default_system_prompt": false
|
||||||
|
}
|
||||||
Reference in New Issue
Block a user