Files
qwen3-8B-sft-v3/_merge_debug.json
ModelHub XC efdcceab27 初始化项目,由ModelHub XC社区提供模型
Model: Mushari440/qwen3-8B-sft-v3
Source: Original Platform
2026-05-27 15:00:18 +08:00

23 lines
695 B
JSON

{
"used_fix_mistral_regex": true,
"base": "/mnt/irdc_afs/alothmanmushari/Qwen/Qwen3-8B-Base",
"adapters": [
"output/OALL_DATASETS_NEWSCRIPT_DETECTED_AND_CLEANED_2e5LR/sft/final"
],
"tokenizer_source": "/mnt/irdc_afs/alothmanmushari/Qwen/Qwen3-8B-Base",
"dtype": "bfloat16",
"device_map": "cpu",
"trust_remote_code": true,
"tokenizer_class": "Qwen2Tokenizer",
"model_class": "Qwen3ForCausalLM",
"tokenizer_vocab_size": 151669,
"model_embedding_rows": 151936,
"bos_token": null,
"bos_token_id": null,
"eos_token": "<|endoftext|>",
"eos_token_id": 151643,
"pad_token": "<|endoftext|>",
"pad_token_id": 151643,
"im_start_id": 151644,
"im_end_id": 151645
}