初始化项目,由ModelHub XC社区提供模型
Model: DanielClough/Candle_Snorkel-Mistral-PairRM-DPO Source: Original Platform
This commit is contained in:
36
.gitattributes
vendored
Normal file
36
.gitattributes
vendored
Normal file
@@ -0,0 +1,36 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
*.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_f16.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_f16.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:0ff77e0b2a84de685fd2b4e5a2ad718d5f8a9c02e409322bfb690353d98283de
|
||||
size 14484018912
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q2k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q2k.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:0e181a80f85ad3b18a0f76c69d9f8cdb69e077d027930f4ae9f19a8c83ca96fe
|
||||
size 2377193184
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q3k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q3k.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:77a37be2805c28ece6558e091a89cf048de7c2430f3d7ac8179dde413d69fd3d
|
||||
size 3112654560
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_0.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8a4038baa0fd02843a4b33d7a7e8198c547165ed5028bc41289bb7bc19c9e2a0
|
||||
size 4074411744
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_1.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q4_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:cab3ad810f852ea5fdb54689b3973c7049d4d89a81e22117b10253d9a3b16729
|
||||
size 4527003360
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q4k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q4k.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:dfa7fd34dcccd2a2c1b953d269b0c85a23aae5625687defe16b59061a3eb75ae
|
||||
size 4074411744
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_0.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:49892e1db1135ea3f64a6986ec1b9553fbfff190736a04652b227cfca3705b9e
|
||||
size 4979594976
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_1.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q5_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a5b013e16292c2fbb628b4aad7d3ba0b951ba6710e82b3fddfad81cac0f045eb
|
||||
size 5432186592
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q5k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q5k.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:cfadf47bb01ee2711f49447de922512c8e059e6500a17f82119309dfbef633e9
|
||||
size 4979594976
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q6k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q6k.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ecb002750ea05bc5610218661a78c3a5a4b276363cbab1e3b033fffd5e948965
|
||||
size 5941352160
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_0.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:fc084c16f9c0cee6003f6fda43b98b7d0c01aa961f90f6a1d0e8a5cc2146b580
|
||||
size 7695144672
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_1.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q8_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:d1645984e17e857132ee83e8dffe03dc97de0f1f6269b5754e6dbbffe9423f3d
|
||||
size 8147736288
|
||||
3
Candle_Snorkel-Mistral-PairRM-DPO_q8k.gguf
Normal file
3
Candle_Snorkel-Mistral-PairRM-DPO_q8k.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:d1d0dfd9ae734b3f0979f94496f7db31b08e22f0f350308eac44bcbaa4a1fbad
|
||||
size 8260884192
|
||||
26
config.json
Normal file
26
config.json
Normal file
@@ -0,0 +1,26 @@
|
||||
{
|
||||
"_name_or_path": "./models_dpo/snorkel_model_0117_20k_mistral_v02_llm_blender_v5",
|
||||
"architectures": [
|
||||
"MistralForCausalLM"
|
||||
],
|
||||
"attention_dropout": 0.0,
|
||||
"bos_token_id": 1,
|
||||
"eos_token_id": 2,
|
||||
"hidden_act": "silu",
|
||||
"hidden_size": 4096,
|
||||
"initializer_range": 0.02,
|
||||
"intermediate_size": 14336,
|
||||
"max_position_embeddings": 32768,
|
||||
"model_type": "mistral",
|
||||
"num_attention_heads": 32,
|
||||
"num_hidden_layers": 32,
|
||||
"num_key_value_heads": 8,
|
||||
"rms_norm_eps": 1e-05,
|
||||
"rope_theta": 1000000.0,
|
||||
"sliding_window": 4096,
|
||||
"tie_word_embeddings": false,
|
||||
"torch_dtype": "bfloat16",
|
||||
"transformers_version": "4.34.0",
|
||||
"use_cache": true,
|
||||
"vocab_size": 32000
|
||||
}
|
||||
3
model-00001-of-00002.safetensors
Normal file
3
model-00001-of-00002.safetensors
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:7d6394774cc65e3bdb29fd6a0ac5564d7ec1d280ff15b8388008e2b147cfb7a8
|
||||
size 9942981664
|
||||
3
model-00002-of-00002.safetensors
Normal file
3
model-00002-of-00002.safetensors
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:abb3a6c68776de48d4d69f311503150a36b60df47bf0736fc27feca271ad0efa
|
||||
size 4540516312
|
||||
91122
tokenizer.json
Normal file
91122
tokenizer.json
Normal file
File diff suppressed because it is too large
Load Diff
45
tokenizer_config.json
Normal file
45
tokenizer_config.json
Normal file
@@ -0,0 +1,45 @@
|
||||
{
|
||||
"added_tokens_decoder": {
|
||||
"0": {
|
||||
"content": "<unk>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false,
|
||||
"special": true
|
||||
},
|
||||
"1": {
|
||||
"content": "<s>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false,
|
||||
"special": true
|
||||
},
|
||||
"2": {
|
||||
"content": "</s>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false,
|
||||
"special": true
|
||||
}
|
||||
},
|
||||
"additional_special_tokens": [
|
||||
"<unk>",
|
||||
"<s>",
|
||||
"</s>"
|
||||
],
|
||||
"bos_token": "<s>",
|
||||
"chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
|
||||
"clean_up_tokenization_spaces": false,
|
||||
"eos_token": "</s>",
|
||||
"legacy": true,
|
||||
"model_max_length": 2048,
|
||||
"pad_token": "</s>",
|
||||
"sp_model_kwargs": {},
|
||||
"spaces_between_special_tokens": false,
|
||||
"tokenizer_class": "LlamaTokenizer",
|
||||
"unk_token": "<unk>",
|
||||
"use_default_system_prompt": false
|
||||
}
|
||||
Reference in New Issue
Block a user