初始化项目,由ModelHub XC社区提供模型
Model: erfanzar/MaticGPT Source: Original Platform
This commit is contained in:
44
.gitattributes
vendored
Normal file
44
.gitattributes
vendored
Normal file
@@ -0,0 +1,44 @@
|
|||||||
|
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.model filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||||
|
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||||
|
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
|
MaticGPT-GGUF.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||||
3
MaticGPT-GGUF.Q2_K.gguf
Normal file
3
MaticGPT-GGUF.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:9bcce6acaf3b955e8342f2862200907680da7d3cb6e2a9ee2818b9eb14d0f967
|
||||||
|
size 432130656
|
||||||
3
MaticGPT-GGUF.Q3_K_L.gguf
Normal file
3
MaticGPT-GGUF.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:5db9495f38fb7bb5aa6e642500054b56dd161a5940a7f80389849eb5f8305316
|
||||||
|
size 591526496
|
||||||
3
MaticGPT-GGUF.Q3_K_M.gguf
Normal file
3
MaticGPT-GGUF.Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:7aa1393951332b7d7b5ea10e2dead86fbe772f6f2833b846573bc871bc04054b
|
||||||
|
size 548403808
|
||||||
3
MaticGPT-GGUF.Q3_K_S.gguf
Normal file
3
MaticGPT-GGUF.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:47e9738b40c0cc273d668813db1c40840e5aab5ea0b53df01702b421e95940da
|
||||||
|
size 499341920
|
||||||
3
MaticGPT-GGUF.Q4_K_M.gguf
Normal file
3
MaticGPT-GGUF.Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:eb794914dc0ad4c0e7145888946f091d512dff91c5313f518c2afb9e69a25539
|
||||||
|
size 667814496
|
||||||
3
MaticGPT-GGUF.Q4_K_S.gguf
Normal file
3
MaticGPT-GGUF.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:f0feb80cef32a3d098b910e7834464d8ab95b930cff46e12b7cb1d4091475f13
|
||||||
|
size 639871584
|
||||||
3
MaticGPT-GGUF.Q5_K_M.gguf
Normal file
3
MaticGPT-GGUF.Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:a637e189c6ef036ee521ce2e911125b504b3161277d784e3c03094e880afc2c6
|
||||||
|
size 782043744
|
||||||
3
MaticGPT-GGUF.Q5_K_S.gguf
Normal file
3
MaticGPT-GGUF.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:7ded321f6fe4e260b8f5d5fc6ce5364651387df677ddd0d8ecbb275301160f94
|
||||||
|
size 766028384
|
||||||
3
MaticGPT-GGUF.Q6_K.gguf
Normal file
3
MaticGPT-GGUF.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:ff1a59c3f30cefceabe350b92032ce2df36c598b96cf6c2e08730f58d0e4d2a1
|
||||||
|
size 903412320
|
||||||
51
README.md
Normal file
51
README.md
Normal file
@@ -0,0 +1,51 @@
|
|||||||
|
---
|
||||||
|
datasets:
|
||||||
|
- erfanzar/ShareGPT4
|
||||||
|
- HuggingFaceH4/no_robots
|
||||||
|
language:
|
||||||
|
- en
|
||||||
|
- fr
|
||||||
|
- es
|
||||||
|
- zh
|
||||||
|
- ru
|
||||||
|
metrics:
|
||||||
|
- accuracy
|
||||||
|
pipeline_tag: text-generation
|
||||||
|
license: mit
|
||||||
|
---
|
||||||
|
|
||||||
|
# LinguaMatic
|
||||||
|
|
||||||
|
LinguaMatic is an advanced AI model designed to handle a wide range of Natural Language Processing (NLP) tasks. With its powerful capabilities, LinguaMatic can assist with tasks such as text classification, sentiment analysis, language translation, question answering, and much more.
|
||||||
|
|
||||||
|
## EasyDel
|
||||||
|
|
||||||
|
The model is fine-tuned using a custom version of UltraChat on a TPU-v4 pod with [EasyDel](https://github.com/erfanzar/EasyDeL).
|
||||||
|
|
||||||
|
## Prompting Method
|
||||||
|
|
||||||
|
LinguaMatic utilizes the llama2 prompting method to generate responses. This method, named after the friendly and intelligent llama, enhances the model's ability to engage in meaningful conversations. The `prompt_model` function provided below demonstrates how the llama2 prompting method is implemented:
|
||||||
|
|
||||||
|
```python
|
||||||
|
def prompt_model(
|
||||||
|
message: str,
|
||||||
|
chat_history: None | list[list[str]] = [],
|
||||||
|
system_prompt: str | None = None
|
||||||
|
) -> str:
|
||||||
|
do_strip = False
|
||||||
|
texts = [f"<s>[INST] <<SYS>>\n{system_prompt}\n<</SYS>>\n\n"] if system_prompt is not None else ["<s>[INST] "]
|
||||||
|
for user_input, response in chat_history:
|
||||||
|
user_input = user_input.strip() if do_strip else user_input
|
||||||
|
do_strip = True
|
||||||
|
texts.append(f'{user_input} [/INST] {response.strip()} </s><s>[INST] ')
|
||||||
|
message = message.strip() if do_strip else message
|
||||||
|
texts.append(f'{message} [/INST]')
|
||||||
|
return ''.join(texts)
|
||||||
|
```
|
||||||
|
|
||||||
|
The `prompt_model` function takes a `message` as input, along with the `chat_history` and `system_prompt`. It generates a formatted text that includes the system prompt (if one is given), the previous user inputs and model responses from `chat_history`, and the current message. This approach allows LinguaMatic to maintain context and provide more coherent and context-aware responses.
|
||||||
|
|
||||||
|
|
||||||
|
## Contributing
|
||||||
|
|
||||||
|
We welcome contributions to enhance LinguaMatic's capabilities and improve its performance. If you encounter any issues or have suggestions for improvement, please feel free to submit a pull request or open an issue on the [EasyDel](https://github.com/erfanzar/EasyDeL) GitHub repository.
|
||||||
102
config.json
Normal file
102
config.json
Normal file
@@ -0,0 +1,102 @@
|
|||||||
|
{
|
||||||
|
"a_ps": [
|
||||||
|
[
|
||||||
|
"dp",
|
||||||
|
"fsdp"
|
||||||
|
],
|
||||||
|
"sp",
|
||||||
|
"tp",
|
||||||
|
null
|
||||||
|
],
|
||||||
|
"architectures": [
|
||||||
|
"LlamaForCausalLM"
|
||||||
|
],
|
||||||
|
"attention_bias": false,
|
||||||
|
"attention_dropout": 0.0,
|
||||||
|
"axis_dims": [
|
||||||
|
1,
|
||||||
|
-1,
|
||||||
|
1,
|
||||||
|
1
|
||||||
|
],
|
||||||
|
"axis_names": [
|
||||||
|
"dp",
|
||||||
|
"fsdp",
|
||||||
|
"tp",
|
||||||
|
"sp"
|
||||||
|
],
|
||||||
|
"b_ps": [
|
||||||
|
[
|
||||||
|
"dp",
|
||||||
|
"fsdp"
|
||||||
|
],
|
||||||
|
null,
|
||||||
|
null,
|
||||||
|
null
|
||||||
|
],
|
||||||
|
"backend": null,
|
||||||
|
"bits": null,
|
||||||
|
"bos_token_id": 1,
|
||||||
|
"c_max_position_embeddings": 2048,
|
||||||
|
"easy_method": "train",
|
||||||
|
"embd_pdrop": 0.0,
|
||||||
|
"eos_token_id": 2,
|
||||||
|
"fcm_max_ratio": 0.0,
|
||||||
|
"fcm_min_ratio": 0.0,
|
||||||
|
"flash_attn_key_chunk_size": 1024,
|
||||||
|
"flash_attn_query_chunk_size": 1024,
|
||||||
|
"freq_max_position_embeddings": 2048,
|
||||||
|
"hidden_act": "silu",
|
||||||
|
"hidden_size": 2048,
|
||||||
|
"initializer_range": 0.02,
|
||||||
|
"intermediate_size": 5632,
|
||||||
|
"k_ps": [
|
||||||
|
[
|
||||||
|
"dp",
|
||||||
|
"fsdp"
|
||||||
|
],
|
||||||
|
"sp",
|
||||||
|
"tp",
|
||||||
|
null
|
||||||
|
],
|
||||||
|
"max_position_embeddings": 2048,
|
||||||
|
"model_type": "llama",
|
||||||
|
"num_attention_heads": 32,
|
||||||
|
"num_hidden_layers": 22,
|
||||||
|
"num_key_value_heads": 4,
|
||||||
|
"number_rep_kv": 1,
|
||||||
|
"pretraining_tp": 1,
|
||||||
|
"q_ps": [
|
||||||
|
[
|
||||||
|
"dp",
|
||||||
|
"fsdp"
|
||||||
|
],
|
||||||
|
"sp",
|
||||||
|
"tp",
|
||||||
|
null
|
||||||
|
],
|
||||||
|
"resid_pdrop": 0.0,
|
||||||
|
"rms_norm_eps": 1e-05,
|
||||||
|
"rope_scaling": null,
|
||||||
|
"rope_theta": 10000.0,
|
||||||
|
"scan_layers": true,
|
||||||
|
"scan_mlp_chunk_size": 1024,
|
||||||
|
"tie_word_embeddings": false,
|
||||||
|
"torch_dtype": "float16",
|
||||||
|
"transformers_version": "4.36.2",
|
||||||
|
"use_cache": true,
|
||||||
|
"use_flash_attention": false,
|
||||||
|
"use_pjit_attention_force": false,
|
||||||
|
"use_sacn_mlp": false,
|
||||||
|
"use_shard_map": false,
|
||||||
|
"v_ps": [
|
||||||
|
[
|
||||||
|
"dp",
|
||||||
|
"fsdp"
|
||||||
|
],
|
||||||
|
"sp",
|
||||||
|
"tp",
|
||||||
|
null
|
||||||
|
],
|
||||||
|
"vocab_size": 32000
|
||||||
|
}
|
||||||
6
generation_config.json
Normal file
6
generation_config.json
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
{
|
||||||
|
"_from_model_config": true,
|
||||||
|
"bos_token_id": 1,
|
||||||
|
"eos_token_id": 2,
|
||||||
|
"transformers_version": "4.36.2"
|
||||||
|
}
|
||||||
3
model.safetensors
Normal file
3
model.safetensors
Normal file
@@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:279873cab2e2742d9a629be2d85f0dea7214c87826365199482a8c2077ebb17d
|
||||||
|
size 2200119664
|
||||||
24
special_tokens_map.json
Normal file
24
special_tokens_map.json
Normal file
@@ -0,0 +1,24 @@
|
|||||||
|
{
|
||||||
|
"bos_token": {
|
||||||
|
"content": "<s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false
|
||||||
|
},
|
||||||
|
"eos_token": {
|
||||||
|
"content": "</s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false
|
||||||
|
},
|
||||||
|
"pad_token": "</s>",
|
||||||
|
"unk_token": {
|
||||||
|
"content": "<unk>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false
|
||||||
|
}
|
||||||
|
}
|
||||||
93391
tokenizer.json
Normal file
93391
tokenizer.json
Normal file
File diff suppressed because it is too large
Load Diff
BIN
tokenizer.model
(Stored with Git LFS)
Normal file
BIN
tokenizer.model
(Stored with Git LFS)
Normal file
Binary file not shown.
41
tokenizer_config.json
Normal file
41
tokenizer_config.json
Normal file
@@ -0,0 +1,41 @@
|
|||||||
|
{
|
||||||
|
"add_bos_token": true,
|
||||||
|
"add_eos_token": false,
|
||||||
|
"added_tokens_decoder": {
|
||||||
|
"0": {
|
||||||
|
"content": "<unk>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
},
|
||||||
|
"1": {
|
||||||
|
"content": "<s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
},
|
||||||
|
"2": {
|
||||||
|
"content": "</s>",
|
||||||
|
"lstrip": false,
|
||||||
|
"normalized": false,
|
||||||
|
"rstrip": false,
|
||||||
|
"single_word": false,
|
||||||
|
"special": true
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"bos_token": "<s>",
|
||||||
|
"clean_up_tokenization_spaces": false,
|
||||||
|
"eos_token": "</s>",
|
||||||
|
"legacy": false,
|
||||||
|
"model_max_length": 1000000000000000019884624838656,
|
||||||
|
"pad_token": "</s>",
|
||||||
|
"padding_side": "right",
|
||||||
|
"sp_model_kwargs": {},
|
||||||
|
"tokenizer_class": "LlamaTokenizer",
|
||||||
|
"unk_token": "<unk>",
|
||||||
|
"use_default_system_prompt": false
|
||||||
|
}
|
||||||
Reference in New Issue
Block a user