初始化项目，由 ModelHub XC 社区提供模型

Model: Mushari440/qwen3-8B-sft-v3
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-05-27 15:00:18 +08:00
commit efdcceab27
13 changed files with 726 additions and 0 deletions

23
_merge_debug.json Normal file
View File

@@ -0,0 +1,23 @@
{
"used_fix_mistral_regex": true,
"base": "/mnt/irdc_afs/alothmanmushari/Qwen/Qwen3-8B-Base",
"adapters": [
"output/OALL_DATASETS_NEWSCRIPT_DETECTED_AND_CLEANED_2e5LR/sft/final"
],
"tokenizer_source": "/mnt/irdc_afs/alothmanmushari/Qwen/Qwen3-8B-Base",
"dtype": "bfloat16",
"device_map": "cpu",
"trust_remote_code": true,
"tokenizer_class": "Qwen2Tokenizer",
"model_class": "Qwen3ForCausalLM",
"tokenizer_vocab_size": 151669,
"model_embedding_rows": 151936,
"bos_token": null,
"bos_token_id": null,
"eos_token": "<|endoftext|>",
"eos_token_id": 151643,
"pad_token": "<|endoftext|>",
"pad_token_id": 151643,
"im_start_id": 151644,
"im_end_id": 151645
}