Model: shuoxing/llama3-8b-full-pretrain-junk-tweet-1m-en-reproduce-bs8 Source: Original Platform
13 lines
194 B
JSON
13 lines
194 B
JSON
{
  "bos_token_id": 128000,
  "do_sample": true,
  "eos_token_id": [
    128001,
    128009
  ],
  "max_length": 4096,
  "temperature": 0.6,
  "top_p": 0.9,
  "transformers_version": "4.55.0"
}