初始化项目,由ModelHub XC社区提供模型
Model: DanielClough/Candle_Snorkel-Mistral-PairRM-DPO Source: Original Platform
This commit is contained in:
36
.gitattributes
vendored
Normal file
36
.gitattributes
vendored
Normal file
@@ -0,0 +1,36 @@
|
|||||||
|
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.model filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||||
|
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_f16.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_f16.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:0ff77e0b2a84de685fd2b4e5a2ad718d5f8a9c02e409322bfb690353d98283de
|
||||||
|
size 14484018912
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q2k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q2k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:0e181a80f85ad3b18a0f76c69d9f8cdb69e077d027930f4ae9f19a8c83ca96fe
|
||||||
|
size 2377193184
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q3k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q3k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:77a37be2805c28ece6558e091a89cf048de7c2430f3d7ac8179dde413d69fd3d
|
||||||
|
size 3112654560
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_0.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:8a4038baa0fd02843a4b33d7a7e8198c547165ed5028bc41289bb7bc19c9e2a0
|
||||||
|
size 4074411744
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_1.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:cab3ad810f852ea5fdb54689b3973c7049d4d89a81e22117b10253d9a3b16729
|
||||||
|
size 4527003360
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q4k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q4k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:dfa7fd34dcccd2a2c1b953d269b0c85a23aae5625687defe16b59061a3eb75ae
|
||||||
|
size 4074411744
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_0.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:49892e1db1135ea3f64a6986ec1b9553fbfff190736a04652b227cfca3705b9e
|
||||||
|
size 4979594976
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_1.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:a5b013e16292c2fbb628b4aad7d3ba0b951ba6710e82b3fddfad81cac0f045eb
|
||||||
|
size 5432186592
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q5k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q5k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:cfadf47bb01ee2711f49447de922512c8e059e6500a17f82119309dfbef633e9
|
||||||
|
size 4979594976
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q6k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q6k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:ecb002750ea05bc5610218661a78c3a5a4b276363cbab1e3b033fffd5e948965
|
||||||
|
size 5941352160
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_0.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:fc084c16f9c0cee6003f6fda43b98b7d0c01aa961f90f6a1d0e8a5cc2146b580
|
||||||
|
size 7695144672
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_1.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:d1645984e17e857132ee83e8dffe03dc97de0f1f6269b5754e6dbbffe9423f3d
|
||||||
|
size 8147736288
|
||||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q8k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q8k.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:d1d0dfd9ae734b3f0979f94496f7db31b08e22f0f350308eac44bcbaa4a1fbad
|
||||||
|
size 8260884192
|
||||||
26
config.json
Normal file
26
config.json
Normal file
@@ -0,0 +1,26 @@
|
|||||||
|
{
|
||||||
|
"_name_or_path": "./models_dpo/snorkel_model_0117_20k_mistral_v02_llm_blender_v5",
|
||||||
|
"architectures": [
|
||||||
|
"MistralForCausalLM"
|
||||||
|
],
|
||||||
|
"attention_dropout": 0.0,
|
||||||
|
"bos_token_id": 1,
|
||||||
|
"eos_token_id": 2,
|
||||||
|
"hidden_act": "silu",
|
||||||
|
"hidden_size": 4096,
|
||||||
|
"initializer_range": 0.02,
|
||||||
|
"intermediate_size": 14336,
|
||||||
|
"max_position_embeddings": 32768,
|
||||||
|
"model_type": "mistral",
|
||||||
|
"num_attention_heads": 32,
|
||||||
|
"num_hidden_layers": 32,
|
||||||
|
"num_key_value_heads": 8,
|
||||||
|
"rms_norm_eps": 1e-05,
|
||||||
|
"rope_theta": 1000000.0,
|
||||||
|
"sliding_window": 4096,
|
||||||
|
"tie_word_embeddings": false,
|
||||||
|
"torch_dtype": "bfloat16",
|
||||||
|
"transformers_version": "4.34.0",
|
||||||
|
"use_cache": true,
|
||||||
|
"vocab_size": 32000
|
||||||
|
}
|
||||||
3
model-00001-of-00002.safetensors
Normal file
3
model-00001-of-00002.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:7d6394774cc65e3bdb29fd6a0ac5564d7ec1d280ff15b8388008e2b147cfb7a8
|
||||||
|
size 9942981664
|
||||||
3
model-00002-of-00002.safetensors
Normal file
3
model-00002-of-00002.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:abb3a6c68776de48d4d69f311503150a36b60df47bf0736fc27feca271ad0efa
|
||||||
|
size 4540516312
|
||||||
91122
tokenizer.json
Normal file
91122
tokenizer.json
Normal file
File diff suppressed because it is too large
Load Diff
45
tokenizer_config.json
Normal file
45
tokenizer_config.json
Normal file
@@ -0,0 +1,45 @@
|
|||||||
|
{
|
||||||
|
"added_tokens_decoder": {
|
||||||
|
"0": {
|
||||||
|
"content": "<unk>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
},
|
||||||
|
"1": {
|
||||||
|
"content": "<s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
},
|
||||||
|
"2": {
|
||||||
|
"content": "</s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additional_special_tokens": [
|
||||||
|
"<unk>",
|
||||||
|
"<s>",
|
||||||
|
"</s>"
|
||||||
|
],
|
||||||
|
"bos_token": "<s>",
|
||||||
|
"chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
|
||||||
|
"clean_up_tokenization_spaces": false,
|
||||||
|
"eos_token": "</s>",
|
||||||
|
"legacy": true,
|
||||||
|
"model_max_length": 2048,
|
||||||
|
"pad_token": "</s>",
|
||||||
|
"sp_model_kwargs": {},
|
||||||
|
"spaces_between_special_tokens": false,
|
||||||
|
"tokenizer_class": "LlamaTokenizer",
|
||||||
|
"unk_token": "<unk>",
|
||||||
|
"use_default_system_prompt": false
|
||||||
|
}
|
||||||
Reference in New Issue
Block a user