初始化项目,由ModelHub XC社区提供模型
Model: erfanzar/MaticGPT Source: Original Platform
This commit is contained in:
44
.gitattributes
vendored
Normal file
44
.gitattributes
vendored
Normal file
@@ -0,0 +1,44 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
MaticGPT-GGUF.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
3
MaticGPT-GGUF.Q2_K.gguf
Normal file
3
MaticGPT-GGUF.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:9bcce6acaf3b955e8342f2862200907680da7d3cb6e2a9ee2818b9eb14d0f967
|
||||
size 432130656
|
||||
3
MaticGPT-GGUF.Q3_K_L.gguf
Normal file
3
MaticGPT-GGUF.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5db9495f38fb7bb5aa6e642500054b56dd161a5940a7f80389849eb5f8305316
|
||||
size 591526496
|
||||
3
MaticGPT-GGUF.Q3_K_M.gguf
Normal file
3
MaticGPT-GGUF.Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:7aa1393951332b7d7b5ea10e2dead86fbe772f6f2833b846573bc871bc04054b
|
||||
size 548403808
|
||||
3
MaticGPT-GGUF.Q3_K_S.gguf
Normal file
3
MaticGPT-GGUF.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:47e9738b40c0cc273d668813db1c40840e5aab5ea0b53df01702b421e95940da
|
||||
size 499341920
|
||||
3
MaticGPT-GGUF.Q4_K_M.gguf
Normal file
3
MaticGPT-GGUF.Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:eb794914dc0ad4c0e7145888946f091d512dff91c5313f518c2afb9e69a25539
|
||||
size 667814496
|
||||
3
MaticGPT-GGUF.Q4_K_S.gguf
Normal file
3
MaticGPT-GGUF.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:f0feb80cef32a3d098b910e7834464d8ab95b930cff46e12b7cb1d4091475f13
|
||||
size 639871584
|
||||
3
MaticGPT-GGUF.Q5_K_M.gguf
Normal file
3
MaticGPT-GGUF.Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a637e189c6ef036ee521ce2e911125b504b3161277d784e3c03094e880afc2c6
|
||||
size 782043744
|
||||
3
MaticGPT-GGUF.Q5_K_S.gguf
Normal file
3
MaticGPT-GGUF.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:7ded321f6fe4e260b8f5d5fc6ce5364651387df677ddd0d8ecbb275301160f94
|
||||
size 766028384
|
||||
3
MaticGPT-GGUF.Q6_K.gguf
Normal file
3
MaticGPT-GGUF.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ff1a59c3f30cefceabe350b92032ce2df36c598b96cf6c2e08730f58d0e4d2a1
|
||||
size 903412320
|
||||
51
README.md
Normal file
51
README.md
Normal file
@@ -0,0 +1,51 @@
|
||||
---
|
||||
datasets:
|
||||
- erfanzar/ShareGPT4
|
||||
- HuggingFaceH4/no_robots
|
||||
language:
|
||||
- en
|
||||
- fr
|
||||
- es
|
||||
- zh
|
||||
- ru
|
||||
metrics:
|
||||
- accuracy
|
||||
pipeline_tag: text-generation
|
||||
license: mit
|
||||
---
|
||||
|
||||
# LinguaMatic
|
||||
|
||||
LinguaMatic is an advanced AI model designed to handle a wide range of Natural Language Processing (NLP) tasks. With its powerful capabilities, LinguaMatic can assist with tasks such as text classification, sentiment analysis, language translation, question answering, and much more.
|
||||
|
||||
## EasyDel
|
||||
|
||||
The model was fine-tuned with a custom version of UltraChat on a TPU-v4 pod using [EasyDeL](https://github.com/erfanzar/EasyDeL).
|
||||
|
||||
## Prompting Method
|
||||
|
||||
LinguaMatic utilizes the llama2 prompting method to generate responses. This method, named after the friendly and intelligent llama, enhances the model's ability to engage in meaningful conversations. The `prompt_model` function provided below demonstrates how the llama2 prompting method is implemented:
|
||||
|
||||
```python
|
||||
def prompt_model(
|
||||
message: str,
|
||||
chat_history: None | list[list[str]] = [],
|
||||
system_prompt: str | None = None
|
||||
) -> str:
|
||||
do_strip = False
|
||||
texts = [f"<s>[INST] <<SYS>>\n{system_prompt}\n<</SYS>>\n\n"] if system_prompt is not None else ["<s>[INST] "]
|
||||
for user_input, response in chat_history:
|
||||
user_input = user_input.strip() if do_strip else user_input
|
||||
do_strip = True
|
||||
texts.append(f'{user_input} [/INST] {response.strip()} </s><s>[INST] ')
|
||||
message = message.strip() if do_strip else message
|
||||
texts.append(f'{message} [/INST]')
|
||||
return ''.join(texts)
|
||||
```
|
||||
|
||||
The `prompt_model` function takes a `message` as input, along with the `chat_history` and `system_prompt`. It generates a formatted text that includes the system prompt, user inputs, and the current message. This approach allows LinguaMatic to maintain context and provide more coherent and context-aware responses.
|
||||
|
||||
|
||||
## Contributing
|
||||
|
||||
We welcome contributions to enhance LinguaMatic's capabilities and improve its performance. If you encounter any issues or have suggestions for improvement, please feel free to submit a pull request or open an issue on the [EasyDeL](https://github.com/erfanzar/EasyDeL) GitHub repository.
|
||||
102
config.json
Normal file
102
config.json
Normal file
@@ -0,0 +1,102 @@
|
||||
{
|
||||
"a_ps": [
|
||||
[
|
||||
"dp",
|
||||
"fsdp"
|
||||
],
|
||||
"sp",
|
||||
"tp",
|
||||
null
|
||||
],
|
||||
"architectures": [
|
||||
"LlamaForCausalLM"
|
||||
],
|
||||
"attention_bias": false,
|
||||
"attention_dropout": 0.0,
|
||||
"axis_dims": [
|
||||
1,
|
||||
-1,
|
||||
1,
|
||||
1
|
||||
],
|
||||
"axis_names": [
|
||||
"dp",
|
||||
"fsdp",
|
||||
"tp",
|
||||
"sp"
|
||||
],
|
||||
"b_ps": [
|
||||
[
|
||||
"dp",
|
||||
"fsdp"
|
||||
],
|
||||
null,
|
||||
null,
|
||||
null
|
||||
],
|
||||
"backend": null,
|
||||
"bits": null,
|
||||
"bos_token_id": 1,
|
||||
"c_max_position_embeddings": 2048,
|
||||
"easy_method": "train",
|
||||
"embd_pdrop": 0.0,
|
||||
"eos_token_id": 2,
|
||||
"fcm_max_ratio": 0.0,
|
||||
"fcm_min_ratio": 0.0,
|
||||
"flash_attn_key_chunk_size": 1024,
|
||||
"flash_attn_query_chunk_size": 1024,
|
||||
"freq_max_position_embeddings": 2048,
|
||||
"hidden_act": "silu",
|
||||
"hidden_size": 2048,
|
||||
"initializer_range": 0.02,
|
||||
"intermediate_size": 5632,
|
||||
"k_ps": [
|
||||
[
|
||||
"dp",
|
||||
"fsdp"
|
||||
],
|
||||
"sp",
|
||||
"tp",
|
||||
null
|
||||
],
|
||||
"max_position_embeddings": 2048,
|
||||
"model_type": "llama",
|
||||
"num_attention_heads": 32,
|
||||
"num_hidden_layers": 22,
|
||||
"num_key_value_heads": 4,
|
||||
"number_rep_kv": 1,
|
||||
"pretraining_tp": 1,
|
||||
"q_ps": [
|
||||
[
|
||||
"dp",
|
||||
"fsdp"
|
||||
],
|
||||
"sp",
|
||||
"tp",
|
||||
null
|
||||
],
|
||||
"resid_pdrop": 0.0,
|
||||
"rms_norm_eps": 1e-05,
|
||||
"rope_scaling": null,
|
||||
"rope_theta": 10000.0,
|
||||
"scan_layers": true,
|
||||
"scan_mlp_chunk_size": 1024,
|
||||
"tie_word_embeddings": false,
|
||||
"torch_dtype": "float16",
|
||||
"transformers_version": "4.36.2",
|
||||
"use_cache": true,
|
||||
"use_flash_attention": false,
|
||||
"use_pjit_attention_force": false,
|
||||
"use_sacn_mlp": false,
|
||||
"use_shard_map": false,
|
||||
"v_ps": [
|
||||
[
|
||||
"dp",
|
||||
"fsdp"
|
||||
],
|
||||
"sp",
|
||||
"tp",
|
||||
null
|
||||
],
|
||||
"vocab_size": 32000
|
||||
}
|
||||
6
generation_config.json
Normal file
6
generation_config.json
Normal file
@@ -0,0 +1,6 @@
|
||||
{
|
||||
"_from_model_config": true,
|
||||
"bos_token_id": 1,
|
||||
"eos_token_id": 2,
|
||||
"transformers_version": "4.36.2"
|
||||
}
|
||||
3
model.safetensors
Normal file
3
model.safetensors
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:279873cab2e2742d9a629be2d85f0dea7214c87826365199482a8c2077ebb17d
|
||||
size 2200119664
|
||||
24
special_tokens_map.json
Normal file
24
special_tokens_map.json
Normal file
@@ -0,0 +1,24 @@
|
||||
{
|
||||
"bos_token": {
|
||||
"content": "<s>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false
|
||||
},
|
||||
"eos_token": {
|
||||
"content": "</s>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false
|
||||
},
|
||||
"pad_token": "</s>",
|
||||
"unk_token": {
|
||||
"content": "<unk>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false
|
||||
}
|
||||
}
|
||||
93391
tokenizer.json
Normal file
93391
tokenizer.json
Normal file
File diff suppressed because it is too large
Load Diff
3
tokenizer.model
Normal file
3
tokenizer.model
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
|
||||
size 499723
|
||||
41
tokenizer_config.json
Normal file
41
tokenizer_config.json
Normal file
@@ -0,0 +1,41 @@
|
||||
{
|
||||
"add_bos_token": true,
|
||||
"add_eos_token": false,
|
||||
"added_tokens_decoder": {
|
||||
"0": {
|
||||
"content": "<unk>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false,
|
||||
"special": true
|
||||
},
|
||||
"1": {
|
||||
"content": "<s>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false,
|
||||
"special": true
|
||||
},
|
||||
"2": {
|
||||
"content": "</s>",
|
||||
"lstrip": false,
|
||||
"normalized": false,
|
||||
"rstrip": false,
|
||||
"single_word": false,
|
||||
"special": true
|
||||
}
|
||||
},
|
||||
"bos_token": "<s>",
|
||||
"clean_up_tokenization_spaces": false,
|
||||
"eos_token": "</s>",
|
||||
"legacy": false,
|
||||
"model_max_length": 1000000000000000019884624838656,
|
||||
"pad_token": "</s>",
|
||||
"padding_side": "right",
|
||||
"sp_model_kwargs": {},
|
||||
"tokenizer_class": "LlamaTokenizer",
|
||||
"unk_token": "<unk>",
|
||||
"use_default_system_prompt": false
|
||||
}
|
||||
Reference in New Issue
Block a user