初始化项目,由ModelHub XC社区提供模型
Model: Undi95/Llama-3-LewdPlay-8B-evo Source: Original Platform
This commit is contained in:
49
.gitattributes
vendored
Normal file
49
.gitattributes
vendored
Normal file
@@ -0,0 +1,49 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
||||
*.tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
*.db* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ark* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text
|
||||
**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.gguf* filter=lfs diff=lfs merge=lfs -text
|
||||
*.ggml filter=lfs diff=lfs merge=lfs -text
|
||||
*.llamafile* filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
|
||||
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
||||
188
README.md
Normal file
188
README.md
Normal file
@@ -0,0 +1,188 @@
|
||||
---
|
||||
license: cc-by-nc-4.0
|
||||
base_model:
|
||||
- vicgalle/Roleplay-Llama-3-8B
|
||||
- Undi95/Llama-3-Unholy-8B-e4
|
||||
- Undi95/Llama-3-LewdPlay-8B
|
||||
library_name: transformers
|
||||
tags:
|
||||
- mergekit
|
||||
- merge
|
||||
---
|
||||
|
||||
# LewdPlay-8B
|
||||
|
||||
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
||||
|
||||
The new EVOLVE merge method was used (on MMLU specifically); see below for more information!
|
||||
|
||||
Unholy was used for uncensoring, Roleplay Llama 3 for the DPO training it received on top, and LewdPlay for the... lewd side.
|
||||
|
||||
## Prompt template: Llama3
|
||||
|
||||
```
|
||||
<|begin_of_text|><|start_header_id|>system<|end_header_id|>
|
||||
|
||||
{system_prompt}<|eot_id|><|start_header_id|>user<|end_header_id|>
|
||||
|
||||
{input}<|eot_id|><|start_header_id|>assistant<|end_header_id|>
|
||||
|
||||
{output}<|eot_id|>
|
||||
```
|
||||
|
||||
## Merge Details
|
||||
### Merge Method
|
||||
|
||||
This model was merged using the [DARE](https://arxiv.org/abs/2311.03099) [TIES](https://arxiv.org/abs/2306.01708) merge method, with ./mergekit/input_models/Roleplay-Llama-3-8B_213413727 as the base.
|
||||
|
||||
### Models Merged
|
||||
|
||||
The following models were included in the merge:
|
||||
* ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
* ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
|
||||
### Configuration
|
||||
|
||||
The following YAML configuration was used to produce this model:
|
||||
|
||||
```yaml
|
||||
base_model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
dtype: bfloat16
|
||||
merge_method: dare_ties
|
||||
parameters:
|
||||
int8_mask: 1.0
|
||||
normalize: 0.0
|
||||
slices:
|
||||
- sources:
|
||||
- layer_range: [0, 4]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.6861808716092435
|
||||
- layer_range: [0, 4]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.6628290134113985
|
||||
weight: 0.5815923052193855
|
||||
- layer_range: [0, 4]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.5113886163963061
|
||||
- sources:
|
||||
- layer_range: [4, 8]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.892655547455918
|
||||
weight: 0.038732602391021484
|
||||
- layer_range: [4, 8]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.1982145486303527
|
||||
- layer_range: [4, 8]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.6843011350690802
|
||||
- sources:
|
||||
- layer_range: [8, 12]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.7817511027396784
|
||||
weight: 0.13053333213489704
|
||||
- layer_range: [8, 12]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.6963703515864826
|
||||
weight: 0.20525481492667985
|
||||
- layer_range: [8, 12]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.6983086326765777
|
||||
weight: 0.5843953969574106
|
||||
- sources:
|
||||
- layer_range: [12, 16]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.9632895768462915
|
||||
weight: 0.2101146706607748
|
||||
- layer_range: [12, 16]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.597557434542081
|
||||
weight: 0.6728172621848589
|
||||
- layer_range: [12, 16]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.756263557607837
|
||||
weight: 0.2581423726361908
|
||||
- sources:
|
||||
- layer_range: [16, 20]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.2116035543552448
|
||||
- layer_range: [16, 20]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.22654226422958418
|
||||
- layer_range: [16, 20]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.8925914810507647
|
||||
weight: 0.42243766315440867
|
||||
- sources:
|
||||
- layer_range: [20, 24]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.7697608089825734
|
||||
weight: 0.1535118632140203
|
||||
- layer_range: [20, 24]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.9886758076773643
|
||||
weight: 0.3305040603868546
|
||||
- layer_range: [20, 24]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.40670083428654535
|
||||
- sources:
|
||||
- layer_range: [24, 28]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.4542810478500622
|
||||
- layer_range: [24, 28]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.8330662483310117
|
||||
weight: 0.2587495367324508
|
||||
- layer_range: [24, 28]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.9845313983551542
|
||||
weight: 0.40378452705975915
|
||||
- sources:
|
||||
- layer_range: [28, 32]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.2951962192288415
|
||||
- layer_range: [28, 32]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.960315594933433
|
||||
weight: 0.13142971773782525
|
||||
- layer_range: [28, 32]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.30838472094518804
|
||||
```
|
||||
|
||||
## Support
|
||||
|
||||
If you want to support me, you can do so [here](https://ko-fi.com/undiai).
|
||||
28
config.json
Normal file
28
config.json
Normal file
@@ -0,0 +1,28 @@
|
||||
{
|
||||
"_name_or_path": "./mergekit/input_models/Roleplay-Llama-3-8B_213413727",
|
||||
"architectures": [
|
||||
"LlamaForCausalLM"
|
||||
],
|
||||
"attention_bias": false,
|
||||
"attention_dropout": 0.0,
|
||||
"bos_token_id": 128000,
|
||||
"eos_token_id": 128001,
|
||||
"hidden_act": "silu",
|
||||
"hidden_size": 4096,
|
||||
"initializer_range": 0.02,
|
||||
"intermediate_size": 14336,
|
||||
"max_position_embeddings": 8192,
|
||||
"model_type": "llama",
|
||||
"num_attention_heads": 32,
|
||||
"num_hidden_layers": 32,
|
||||
"num_key_value_heads": 8,
|
||||
"pretraining_tp": 1,
|
||||
"rms_norm_eps": 1e-05,
|
||||
"rope_scaling": null,
|
||||
"rope_theta": 500000.0,
|
||||
"tie_word_embeddings": false,
|
||||
"torch_dtype": "bfloat16",
|
||||
"transformers_version": "4.40.0",
|
||||
"use_cache": true,
|
||||
"vocab_size": 128256
|
||||
}
|
||||
1
configuration.json
Normal file
1
configuration.json
Normal file
@@ -0,0 +1 @@
|
||||
{"framework": "pytorch", "task": "text-generation", "allow_remote": true}
|
||||
135
mergekit_config.yml
Normal file
135
mergekit_config.yml
Normal file
@@ -0,0 +1,135 @@
|
||||
base_model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
dtype: bfloat16
|
||||
merge_method: dare_ties
|
||||
parameters:
|
||||
int8_mask: 1.0
|
||||
normalize: 0.0
|
||||
slices:
|
||||
- sources:
|
||||
- layer_range: [0, 4]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.6861808716092435
|
||||
- layer_range: [0, 4]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.6628290134113985
|
||||
weight: 0.5815923052193855
|
||||
- layer_range: [0, 4]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.5113886163963061
|
||||
- sources:
|
||||
- layer_range: [4, 8]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.892655547455918
|
||||
weight: 0.038732602391021484
|
||||
- layer_range: [4, 8]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.1982145486303527
|
||||
- layer_range: [4, 8]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.6843011350690802
|
||||
- sources:
|
||||
- layer_range: [8, 12]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.7817511027396784
|
||||
weight: 0.13053333213489704
|
||||
- layer_range: [8, 12]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.6963703515864826
|
||||
weight: 0.20525481492667985
|
||||
- layer_range: [8, 12]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.6983086326765777
|
||||
weight: 0.5843953969574106
|
||||
- sources:
|
||||
- layer_range: [12, 16]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.9632895768462915
|
||||
weight: 0.2101146706607748
|
||||
- layer_range: [12, 16]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.597557434542081
|
||||
weight: 0.6728172621848589
|
||||
- layer_range: [12, 16]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.756263557607837
|
||||
weight: 0.2581423726361908
|
||||
- sources:
|
||||
- layer_range: [16, 20]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.2116035543552448
|
||||
- layer_range: [16, 20]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.22654226422958418
|
||||
- layer_range: [16, 20]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.8925914810507647
|
||||
weight: 0.42243766315440867
|
||||
- sources:
|
||||
- layer_range: [20, 24]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 0.7697608089825734
|
||||
weight: 0.1535118632140203
|
||||
- layer_range: [20, 24]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.9886758076773643
|
||||
weight: 0.3305040603868546
|
||||
- layer_range: [20, 24]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.40670083428654535
|
||||
- sources:
|
||||
- layer_range: [24, 28]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.4542810478500622
|
||||
- layer_range: [24, 28]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.8330662483310117
|
||||
weight: 0.2587495367324508
|
||||
- layer_range: [24, 28]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 0.9845313983551542
|
||||
weight: 0.40378452705975915
|
||||
- sources:
|
||||
- layer_range: [28, 32]
|
||||
model: ./mergekit/input_models/Llama-3-LewdPlay-8B-e3_2981937066
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.2951962192288415
|
||||
- layer_range: [28, 32]
|
||||
model: ./mergekit/input_models/Llama-3-Unholy-8B-e4_1440388923
|
||||
parameters:
|
||||
density: 0.960315594933433
|
||||
weight: 0.13142971773782525
|
||||
- layer_range: [28, 32]
|
||||
model: ./mergekit/input_models/Roleplay-Llama-3-8B_213413727
|
||||
parameters:
|
||||
density: 1.0
|
||||
weight: 0.30838472094518804
|
||||
3
model-00001-of-00002.safetensors
Normal file
3
model-00001-of-00002.safetensors
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a8a08becf33e6d4967e7cfbd3e362d8efc9cd560135ff9089fd3c9ae47241ee4
|
||||
size 9953405736
|
||||
3
model-00002-of-00002.safetensors
Normal file
3
model-00002-of-00002.safetensors
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:d608e696acd6e5ec6f882e97f7812fdeb357d4dfb081c0b3a75542a9e0235902
|
||||
size 6107150624
|
||||
1
model.safetensors.index.json
Normal file
1
model.safetensors.index.json
Normal file
File diff suppressed because one or more lines are too long
16
special_tokens_map.json
Normal file
16
special_tokens_map.json
Normal file
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"bos_token": {
|
||||
"content": "<|begin_of_text|>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false
|
||||
},
|
||||
"eos_token": {
|
||||
"content": "<|end_of_text|>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false
|
||||
}
|
||||
}
|
||||
3
tokenizer.json
Normal file
3
tokenizer.json
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c05a3c2174e9edd5be19dc5a0748c42a9037bec2811ce062728bfd71f8702d78
|
||||
size 9084490
|
||||
2062
tokenizer_config.json
Normal file
2062
tokenizer_config.json
Normal file
File diff suppressed because it is too large
Load Diff
Reference in New Issue
Block a user