Files
Qemma-sft/generation_config_think.json

20 lines
363 B
JSON
Raw Permalink Normal View History

{
"bos_token_id": 2,
"eos_token_id": 1,
"pad_token_id": 0,
"do_sample": true,
"max_new_tokens": 1024,
"max_length": 4096,
"temperature": 0.4,
"top_p": 0.90,
"top_k": 40,
"no_repeat_ngram_size": 3,
"repetition_penalty": 1.07,
"stop_sequences": ["</think>", "</reasoning_step>"],
"use_cache": true,
"transformers_version": "4.57.1"
}