初始化项目,由ModelHub XC社区提供模型
Model: reaperdoesntknow/Qemma-sft Source: Original Platform
This commit is contained in:
20
generation_config_think.json
Normal file
20
generation_config_think.json
Normal file
@@ -0,0 +1,20 @@
{
  "bos_token_id": 2,
  "eos_token_id": 1,
  "pad_token_id": 0,
  "do_sample": true,

  "max_new_tokens": 1024,
  "max_length": 4096,

  "temperature": 0.4,
  "top_p": 0.90,
  "top_k": 40,

  "no_repeat_ngram_size": 3,
  "repetition_penalty": 1.07,

  "stop_sequences": ["</think>", "</reasoning_step>"],
  "use_cache": true,
  "transformers_version": "4.57.1"
}
Reference in New Issue
Block a user