Update config.json

Refactor: Remove `_name_or_path` and increase `max_position_embeddings` to 4096

- Removed the `_name_or_path` parameter as it's no longer necessary.
- Updated `max_position_embeddings` from 2048 to 4096 so the model config allows longer input sequences.
This commit is contained in:
li lin
2024-10-08 07:43:36 +00:00
committed by system
parent 4160a49c1e
commit 6a5d6095ba

View File

@@ -1,5 +1,4 @@
{
-"_name_or_path": "./models/llama3-8b_sft_full_1e-5_bs8000_3_trainv59_a/checkpoint-1596",
"architectures": [
"LlamaForCausalLM"
],
@@ -11,7 +10,7 @@
"hidden_size": 4096,
"initializer_range": 0.02,
"intermediate_size": 14336,
-"max_position_embeddings": 2048,
+"max_position_embeddings": 4096,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 32,