# xc_validation_strategy/main.py

"""
xc_validation_strategy — 主入口

启动后执行一次模型验证任务批量提交，之后保持 HTTP 服务存活。
同时暴露 /health（K8s 探活）和 /status（运行状态）。
"""

import json
import os
import signal
import threading
from datetime import datetime
from http.server import BaseHTTPRequestHandler, ThreadingHTTPServer
from typing import List, Tuple

import requests

# ══════════════════════════════════════════════════════════
#  Configuration (environment variables take precedence)
# ══════════════════════════════════════════════════════════
BASE_URL           = os.environ.get("BASE_URL", "https://modelhub.org.cn")
SUBMIT_ENDPOINT    = "/adminApi/async/task/create-contest-task"

# Credentials are read from the environment first; the literals below are
# only a fallback so that existing deployments keep working unchanged.
# NOTE(review): the fallback values are credentials committed to source
# control. Rotate them and remove the defaults once AUTH_TOKEN and
# CONTEST_API_TOKEN are injected by the deployment.
# A fresh AUTH_TOKEN can be obtained via:
#   curl -X POST https://modelhub.org.cn/adminApi/user/login
AUTH_TOKEN        = os.environ.get(
    "AUTH_TOKEN",
    "eyJ0eXAiOiJKV1QiLCJhbGciOiJIUzI1NiJ9.eyJ1c2VyQWNjb3VudCI6Inpob3VzaGFzaGEiLCJpZCI6MTQsInVzZXJSb2xlIjoibGVhZGVyYm9hcmQiLCJleHAiOjE3ODE4NTE0NzcsImlhdCI6MTc4MTI0NjY3N30.p3uvCpG50aLNifNVVXxvzmWJahbLM5K1671FVCtj8E8",
)
CONTEST_API_TOKEN = os.environ.get(
    "CONTEST_API_TOKEN",
    "ef1ef82f3c9efee413d602345fbe224d",
)
CONTRIBUTORS      = "zhoushasha"
GPU_TYPE          = "Cambricon_mlu-370-x8"
TASK_TYPE         = "text-generation"
STRATEGY_ID       = os.environ.get("STRATEGY_ID", "")  # injected by the platform; do not edit

# Address the HTTP health/status server binds to.
HTTP_HOST = "0.0.0.0"
HTTP_PORT = 8080

# ══════════════════════════════════════════════════════════
#  Model list
# ══════════════════════════════════════════════════════════
# Model IDs that the worker submits, one task per entry, in list order.
# Only the uncommented entries are part of the list at runtime; the
# commented-out IDs are skipped (presumably handled by earlier runs —
# not verifiable from this file).
ALL_MODEL_IDS = [
    # "UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3",
    # "migtissera/SynthIA-7B-v1.3",
    # "TinyLlama/TinyLlama-1.1B-intermediate-step-955k-token-2T",
    # "bigscience/bloomz-1b1",
    # "EleutherAI/pythia-6.9b-deduped",
    # "AvitoTech/avibe",
    # "Enoch/llama-7b-hf",
    # "asingh15/qwen-abs-verl-sft-rephrased-lr5e6-ep1-0109",
    # "PrimeIntellect/INTELLECT-1",
    # "neuralmagic/starcoder2-3b-quantized.w8a8",
    # "Saxo/Linkbricks-Horizon-AI-Korean-Gemma-2-sft-dpo-27B",
    # "HuggingFaceH4/zephyr-7b-gemma-v0.1",
    # "neuralmagic/Llama-2-7b-chat-quantized.w4a16",
    # "neuralmagic/starcoder2-15b-quantized.w8a8",
    # "DAMO-NLP-SG/Qwen2.5-7B-LongPO-128K",
    # "guardrail/llama-2-7b-guanaco-instruct-sharded",
    # "shenzhi-wang/Gemma-2-27B-Chinese-Chat",
    # "pavankumarbalijepalli/phi2-sqlcoder",
    # "neph1/bellman-7b-mistral-instruct",
    # "neuralmagic/Meta-Llama-3-8B-Instruct-quantized.w8a16",
    # "neuralmagic/Qwen2-7B-Instruct-quantized.w8a8",
    # "lamm-mit/BioinspiredLLM",
    # "neuralmagic/Qwen2-7B-Instruct-quantized.w8a16",
    # "dataopsnick/Qwen3-4B-Instruct-2507-zip-rc",
    # "huihui-ai/MicroThinker-3B-Preview",
    # "OrionStarAI/Orion-14B-Base",
    # "georgesung/llama3_8b_chat_uncensored",
    # "FreedomIntelligence/RAG-Instruct-Llama3-3B",
    # "Aryanne/WestSenzu-Swap-7B",
    # "Josephgflowers/Cinder-Phi-2-Test-1",
    # "FreedomIntelligence/Apollo-6B",
    # "Josephgflowers/Tinyllama-1.3B-Cinder-Reason-Test-2",
    # "Josephgflowers/Tinyllama-1.3B-Cinder-Reason-Test",
    # "247labs/Llama-2-7b-Verse-Bot",
    # "praneethposina/customer_support_bot",
    # "KBlueLeaf/TIPO-200M",
    # "norallm/normistral-11b-warm",
    # "theprint/Boptruth-Agatha-7B",
    # "ericflo/Llama-3.1-8B-ContinuedTraining2-FFT",
    # "okwinds/OpenR1-Qwen-7B",
    # "ruohuaw/deepquery-3b-sft",
    # "theprint/Boptruth-NeuralMonarch-7B",
    # "MaziyarPanahi/calme-3.1-qwenloi-3b",
    # "alperiox/trendyol-7b-base-v1-mtLoRA_entr",
    # "theprint/phi-3-mini-4k-python",
    # "uukuguy/speechless-nl2sql-ds-6.7b",
    # "uukuguy/speechless-coder-ds-6.7b",
    # "tybrs/llama-guard-quant",
    # "Josephgflowers/TinyLlama-3T-Cinder-v1.3",
    # "mlabonne/Darewin-7B-v2",
    # "TeichAI/Qwen3-1.7B-Gemini-2.5-Flash-Lite-Preview-Distill",
    # "TeichAI/Nemotron-Orchestrator-8B-DeepSeek-v3.2-Speciale-Distill",
    # "shadowml/BeagSake-7B",
    # "lex-hue/Delexa-7b",
    # "h2oai/h2o-danube3-500m-chat",
    # "bigcode/gpt_bigcode-santacoder",
    # "openlm-research/open_llama_7b",
    # "upstage/SOLAR-10.7B-v1.0",
    # "prithivMLmods/Phi-3.5-Mini-Xalate",
    # "prithivMLmods/Qwen3-Bifrost-SOL-4B-GUFF",
    # "prithivMLmods/Volans-Opus-14B-Exp",
    # "prithivMLmods/Viper-OneCoder-UIGEN",
    # "prithivMLmods/Tucana-Opus-14B-r999",
    # "prithivMLmods/Sombrero-Opus-14B-Sm5",
    # "prithivMLmods/Sombrero-Opus-14B-Sm4",
    # "prithivMLmods/Reasoning-SmolLM2-135M",
    # "prithivMLmods/Sombrero-Opus-14B-Sm1",
    # "prithivMLmods/LwQ-10B-Instruct",
    # "prithivMLmods/Sombrero-Opus-14B-Elite5",
    # "prithivMLmods/Eridanus-Opus-14B-r999",
    # "prithivMLmods/Equuleus-Opus-14B-Exp",
    # "prithivMLmods/Epimetheus-14B-Axo",
    # "prithivMLmods/Phi-4-Math-IO",
    # "prithivMLmods/Omni-Reasoner4-Merged",
    # "prithivMLmods/Pegasus-Opus-14B-Exp",
    # "prithivMLmods/Elita-1",
    # "prithivMLmods/Delta-Pavonis-Qwen-14B",
    # "prithivMLmods/Nu2-Lupi-Qwen-14B",
    # "prithivMLmods/Coma-II-14B",
    # "MaziyarPanahi/calme-2.7-qwen2-7b",
    # "prithivMLmods/Monocerotis-V838-14B",
    # "prithivMLmods/Calcium-Opus-14B-Merge",
    # "prithivMLmods/Calcium-Opus-14B-Elite3",
    # "prithivMLmods/Calcium-Opus-14B-Elite2-R1",
    # "prithivMLmods/Calcium-Opus-14B-Elite2",
    # "prithivMLmods/Calcium-Opus-14B-Elite-Stock",
    # "prithivMLmods/Megatron-Opus-14B-2.1",
    # "prithivMLmods/Blaze.1-27B-Reflection",
    # "prithivMLmods/Megatron-Corpus-14B-Exp.v2",
    # "prithivMLmods/Megatron-Corpus-14B-Exp",
    # "GAIR/autoj-bilingual-6b",
    # "TheBloke/airoboros-7b-gpt4-fp16",
    # "Undi95/Mistral-11B-OmniMix9",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C016-pretrain-v0.2",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C017-instruct-v0.2",
    # "mlabonne/NeuralDarewin-7B",
    # "0xgr3y/Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-tall_tame_panther",
    # "openlm-research/open_llama_3b_v2",
    # "Nobitaxi/InternLM2-chat-7B-SQL",
    # "testUser/Qwen3-1.7b-Medical-R1-sft",
    # "mlabonne/Zebrafish-7B",
    # "mlabonne/NeuralPipe-7B-slerp",
    # "laion/openthoughts-4-code-qwen3-32b-annotated-7k_qwen3-1.7B_10k",
    # "Fengshenbang/Ziya-LLaMA-13B-v1.1",
    # "arcee-ai/Saul-Instruct-Mistral-7B-Instruct-v0.2-Slerp",
    # "arcee-ai/Saul-Instruct-Clown-7b",
    # "prithivMLmods/Megatron-Opus-7B-Exp",
    # "Vikhrmodels/QVikhr-3-8B-Instruction",
    # "TheBloke/Nous-Hermes-13B-SuperHOT-8K-fp16",
    # "TheBloke/UltraLM-13B-fp16",
    # "PocketDoc/Dans-TotSirocco-7b",
    # "LLM-Research/Meta-Llama-3.1-8B",
    # "Qwen/Qwen2.5-Coder-32B",
    # "Qwen/Qwen2.5-7B-Instruct-1M",
    # "Qwen/Qwen2-57B-A14B-Instruct",
    # "Qwen/Qwen2.5-14B-Instruct-1M",
    # "Qwen/Qwen-1_8B-Chat",
    # "Qwen/Qwen1.5-MoE-A2.7B-Chat",
    # "Qwen/Qwen1.5-MoE-A2.7B",
    # "Qwen/Qwen1.5-14B-Chat",
    # "Qwen/Qwen1.5-14B",
    # "Qwen/Qwen-14B",
    # "deepseek-ai/DeepSeek-Coder-V2-Lite-Base",
    # "TheBloke/tulu-13B-fp16",
    # "TheBloke/Kimiko-Mistral-7B-fp16",
    # "TheBloke/Llama-2-13B-fp16",
    # "mlabonne/Monarch-7B",
    # "TheBloke/tulu-7B-fp16",
    # "01ai/Yi-9B",
    # "TheBloke/koala-7B-HF",
    # "AI-ModelScope/txgemma-2b-predict",
    # "LLM-Research/OLMo-7B-0724-SFT-hf",
    # "JsonZhang02/Llama3.2-1B-PCL",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C019-instruct-v0.2",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C016-instruct-v0.2",
    # "FreedomIntelligence/AceGPT-v1.5-13B-Chat",
    # "MediaTek-Research/Breeze-7B-Base-v0_1",
    # "OpenBuddy/openbuddy-llama3-8b-v21.1-8k",
    # "HIT-TMG/Mixtral_13B_Chat_RAG-Reader",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C014-pretrain-v0.2",
    # "arcee-ai/arcee-lite",
    # "X-D-Lab/MindChat-Qwen2-4B",
    # "mlabonne/NeuralMonarch-7B",
    # "ibm-granite/granite-3b-code-instruct-2k",
    # "LLM-Research/OLMo-7B-Twin-2T-hf",
    # "PocketDoc/Dans-AdventurousWinds-Mk2-7b",
    # "LLM-Research/Qwen2-Math-7B",
    # "MediaTek-Research/Breeze-7B-Base-v1_0",
    # "LLM-Research/layerskip-llama2-13B",
    # "prithivMLmods/TESS-QwenRe-1.5B",
    # "prithivMLmods/Octantis-QwenR1-1.5B",
    # "prithivMLmods/Qwen3-1.7B-ft-bf16",
    # "prithivMLmods/Theta-Crucis-0.6B-Turbo1",
    # "prithivMLmods/Omega-Qwen3-Atom-8B",
    # "prithivMLmods/Mintaka-Qwen3-1.6B-V3.1",
    # "NousResearch/Yarn-Llama-2-7b-64k",
    # "prithivMLmods/Panacea-MegaScience-Qwen3-1.7B",
    # "prithivMLmods/TOI-157-Phi-4-Reasoning-Mini",
    # "prithivMLmods/Vulpecula-4B",
    # "LLM-Research/OLMo-7B-0424-hf",
    # "LLM-Research/OLMo-7B-hf",
    # "LLM-Research/OLMo-7B-SFT-hf",
    # "AI-ModelScope/starcoder2-7b",
    # "LLM-Research/OLMo-7B-0724-hf",
    # "OpenBMB/BitCPM4-1B",
    # "LLM-Research/truthfulqa-truth-judge-llama2-7B",
    # "LLM-Research/OLMo-1B-0724-hf",
    # "HIT-TMG/Qwen1.5-14B-Chat_RAG-Reader",
    # "OpenBMB/MiniCPM4-MCP",
    # "AI-ModelScope/sqlcoder-7b-2",
    # "FuseAI/OpenChat-3.5-7B-SOLAR-v2.0",
    # "JsonZhang02/Llama3.2-1B-SFT",
    # "MaziyarPanahi/neural-chat-7b-v3-2-Mistral-7B-Instruct-v0.1",
    # "MaziyarPanahi/SauerkrautLM-7b-HerO-Mistral-7B-Instruct-v0.1",
    # "prithivMLmods/Segue-Qwen3_DeepScaleR-Preview",
    # "NovaSky-AI/Sky-T1-7B-Zero",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C020-pretrain-v0.2",
    # "NovaSky-AI/Sky-T1-7B-step2",
    # "NousResearch/CodeLlama-7b-hf-flash",
    # "LLM-Research/layerskip-llama3-8B",
    # "LLM-Research/OLMo-1B-hf",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C018-pretrain-v0.2",
    # "NousResearch/CodeLlama-7b-Instruct-hf-flash",
    # "Nexusflow/NexusRaven-V2-13B",
    # "AI-ModelScope/NuExtract-v1.5",
    # "NousResearch/Nous-Capybara-3B-V1.9",
    # "NousResearch/Nous-Capybara-7B-V1",
    # "NousResearch/Yarn-Solar-10b-32k",
    # "LLM-Research/Llama-Guard-4-12B",
    # "OpenPipe/gemma-3-4b-it-text-only-2",
    # "OpenPipe/Deductive-Reasoning-Qwen-14B",
    # "OpenPipe/gemma-3-12b-it-text-only",
    # "AI-MO/NuminaMath-7B-CoT",
    # "GAIR/Abel-7B-001",
    # "prithivMLmods/Novaeus-Promptist-7B-Instruct",
    # "SakanaAI/EvoLLM-JP-v1-7B",
    # "FreedomIntelligence/Apollo-1.8B",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C013-instruct-v0.2",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C013-pretrain-v0.2",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C015-pretrain-v0.2",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C014-instruct-v0.2",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C021-instruct-v0.2",
    # "NousResearch/Meta-Llama-3.1-8B",
    # "OpenPipe/Qwen3-14B-Instruct",
    # "unsloth/OpenHermes-2.5-Mistral-7B",
    # "OpenBuddy/openbuddy-mistral-22b-v21.1-32k",
    # "FlyDutch/telechat2-7b-Cot",
    # "HuggingFaceH4/mistral-7b-sft-alpha",
    # "PAI/pai-qwen1_5-7b-doc2qa",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C018-instruct-v0.2",
    # "Magpie-Align/Llama-3-8B-Tulu-330K",
    # "prithivMLmods/Blaze.1-27B-Preview",
    # "allenai/OLMo-7B-0424-SFT-hf",
    # "mlabonne/Meta-Llama-3-8B",
    # "LLM-Research/layerskip-codellama-7B",
    # "prithivMLmods/Sculptor-Qwen3_Med-Reasoning",
    # "prithivMLmods/SmolLM2-360M-Grpo-r999",
    # "prithivMLmods/SmolLM2-1.7B-Open-Thought",
    # "LLM-Research/open-instruct-llama2-sharegpt-7b",
    # "prithivMLmods/SmolLM2_135M_Grpo_Checkpoint",
    # "OpenBuddy/openbuddy-qwen2.5llamaify-14b-v23.1-200k",
    # "OpenBuddy/openbuddy-zero-3b-v21.2-32k",
    # "YeungNLP/firefly-llama2-7b-chat",
    # "OpenBuddy/openbuddy-zero-14b-v22.3-32k",
    # "OpenBuddy/openbuddy-yi1.5-9b-v21.1-32k",
    # "FuseAI/OpenChat-3.5-7B-Starling-v2.0",
    # "prithivMLmods/Qwen-7B-Distill-Reasoner",
    # "FuseAI/OpenChat-3.5-7B-InternLM-v2.0",
    # "prithivMLmods/Galactic-Qwen-14B-Exp1",
    # "prithivMLmods/Sombrero-R1-14B-Elite13",
    # "prithivMLmods/Sombrero-Opus-14B-Elite13",
    # "TheBloke/Planner-7B-fp16",
    # "AI-ModelScope/speed-synthesis-8b-senior",
    # "PocketDoc/Dans-AdventurousWinds-7b",
    # "MaziyarPanahi/calme-3.2-baguette-3b",
    # "MaziyarPanahi/calme-3.2-instruct-3b",
    # "IntervitensInc/intv_ai_mk11",
    # "prithivMLmods/Muscae-Qwen3-UI-Code-4B",
    # "NousResearch/Llama-2-7b-hf",
    # "prithivMLmods/Pocket-Llama-3.2-3B-Instruct",
    # "OpenBuddy/openbuddy-openllama-13b-v7-fp16",
    # "LLM-Research/WildLlama-7b-assistant-only",
    # "prithivMLmods/Raptor-X2",
    # "OpenBuddy/openbuddy-qwen1.5-14b-v20.1-32k",
    # "NaniDAO/Meta-Llama-3.1-8B-Instruct-ablated-v1",
    # "LLM-Research/OLMo-7B-Instruct-hf",
    # "OpenBuddy/openbuddy-zen-3b-v21.2-32k",
    # "OpenBuddy/openbuddy-qwen1.5-14b-v21.1-32k",
    # "LLM-Research/llama2-7b-WildJailbreak",
    # "JunHowie/MiniCPM4-8B",
    # "OpenBuddy/openbuddy-coder-15b-v10-bf16",
    # "JunHowie/MiniCPM4-0.5B",
    # "OpenDevin/CodeQwen1.5-7B-OpenDevin",
    # "OpenBuddy/openbuddy-mistral-10b-v17.1-32k",
    # "PAI/DistilQwen2.5-DS3-0324-7B",
    # "OpenBuddy/openbuddy-llama2-13b64k-v15",
    # "OpenBuddy/openbuddy-falcon-7b-v5-fp16",
    # "NousResearch/Hermes-2-Theta-Llama-3-8B",
    # "NousResearch/Hermes-2-Pro-Mistral-7B",
    # "OpenBuddy/openbuddy-openllama-7b-v5-fp16",
    # "PAI/DistillQwen-ThoughtY-8B",
    # "BSC-LT/salamandra-2b",
    # "pfnet/nekomata-7b-pfn-qfin-inst-merge",
    # "BSC-LT/experimental7b-rag-instruct",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C019-pretrain-v0.2",
    # "OpenBuddy/OpenBuddy-R10528DistillQwen-14B-v27.4-200K",
    # "OpenBuddy/OpenBuddy-R10528DistillQwen-14B-v27.1",
    # "OpenBuddy/SimpleChat-4B-V1",
    # "AI-ModelScope/granite-8b-code-base-4k",
    # "mlabonne/NeuralHermes-2.5-Mistral-7B",
    # "BSC-LT/experimental7b-rag",
    # "prithivMLmods/SmolLM2_135M_Grpo_Gsm8k",
    # "OpenBuddy/openbuddy-zen-3b-v21.1-32k",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C015-instruct-v0.2",
    # "prithivMLmods/QwQ-LCoT1-Merged",
    # "mlabonne/NeuralBeagle14-7B",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C020-instruct-v0.2",
    # "mlabonne/NeuralMarcoro14-7B",
    # "PKU-Alignment/ProgressGym-HistLlama3-8B-C017-pretrain-v0.2",
    # "FuseAI/OpenChat-3.5-7B-Mixtral-v2.0",
    # "mlabonne/FrankenMonarch-7B",
    # "stabilityai/stablelm-tuned-alpha-3b",
    # "prithivMLmods/Viper-Coder-v1.5-r999",
    # "prithivMLmods/Galactic-Qwen-14B-Exp2",
    # "HuggingFaceTB/cosmo-1b",
    # "LLM-Research/WildLlama-7b-user-assistant",
    # "OpenBuddy/openbuddy-llama2-13b-v8.1-fp16",
    # "prithivMLmods/Regulus-Qwen3-R1-Llama-Distill-1.7B",
    # "LLM-Research/OLMo-7B-0424-SFT-hf",
    # "huihui-ai/MicroThinker-1B-Preview",
    # "OpenBuddy/openbuddy-openllama-3b-v10-bf16",
    # "LLM-Research/digital-socrates-13b",
    # "prithivMLmods/Viper-Coder-v1.6-r999",
    # "prithivMLmods/Magpie-Qwen-DiMind-1.7B",
    # "BAAI/CareBot_Medical_multi-llama3-8b-base",
    # "NousResearch/Meta-Llama-3-8B",
    # "OpenBuddy/openbuddy-llama2-13b-v15p1-64k",
    # "NousResearch/Yarn-Mistral-7b-64k",
    # "PrimeIntellect/DeepSeek-R1-Distill-Qwen-1.5B",
    # "Undi95/Meta-Llama-3-8B-Instruct-hf",
    # "FuseAI/OpenChat-3.5-7B-Mixtral",
    # "prithivMLmods/Viper-Coder-Hybrid-v1.3",
    # "OpenBuddy/openbuddy-qwen2.5llamaify-7b-v23.1-200k",
    # "LLM-Research/mistral-7b",
    # "OpenBuddy/openbuddy-qwen2.5llamaify-14b-v23.3-200k",
    # "prithivMLmods/Viper-Coder-HybridMini-v1.3",
    # "OpenBuddy/openbuddy-atom-13b-v9-bf16",
    # "OpenBuddy/openbuddy-llama3.2-3b-v23.2-131k",
    # "ibm-granite/granite-3b-code-instruct-128k",
    # "PierreZCW/Breeze-7B-Instruct-v1_0",
    # "mlabonne/Marcoro14-7B-slerp",
    # "AI-ModelScope/openbuddy-falcon-7b-v15-fp16",
    # "AI-ModelScope/falcon-7b",
    # "BAAI/AquilaChat2-7B",
    # "PrimeIntellect/Qwen3-0.6B",
    # "OuteAI/Lite-Oute-1-65M-Instruct",
    # "AI-ModelScope/granite-3b-code-instruct-128k",
    # "PrimeIntellect/Qwen3-8B",
    # "OpenBuddy/openbuddy-falcon-7b-v6-bf16",
    # "MaziyarPanahi/calme-3.1-instruct-3b",
    # "LLM-Research/open-instruct-llama2-sharegpt-dpo-7b",
    # "PocketDoc/Dans-PersonalityEngine-v1.0.0-8b",
    # "FuseAI/FuseChat-Llama-3.1-8B-Instruct",
    # "OpenBuddy/openbuddy-mixtral-7bx8-v18.1-32k",
    # "OpenBuddy/openbuddy-deepseekcoder-6b-v16.1-32k",
    # "HuggingFaceTB/SmolLM-1.7B",
    # "LLM-Research/Llama-4-Scout-17B-16E-Instruct",
    # "argilla/distilabeled-Marcoro14-7B-slerp-full",
    # "HuggingFaceTB/SmolLM2-1.7B",
    # "argilla/distilabeled-Marcoro14-7B-slerp",
    # "l3utterfly/open-llama-3b-v2-layla",
    "motherduckdb/DuckDB-NSQL-7B-v0.1",
    "ilkayO/Karga-2B-Thinking",
    "vtgh1602/legal-llm-v1-qwen25-7b-merged",
    "Alelcv27/Llama3.2-3B-Dare-Math-Code",
    "adamo1139/aya-expanse-8b-ungated",
    "Alelcv27/Llama3.2-3B-TIES-Math-Code",
    "chanwit/flux-7b-v0.1",
    "nfaheem/Marcoroni-7b-DPO-Merge",
    "trillionlabs/android_control_ER_index_1000",
    "biodatlab/ec-raft",
    "LLM4Binary/llm4decompile-1.3b-v1.5",
    "LLM4Binary/llm4decompile-1.3b-v2",
    "Ramikan-BR/tinyllama-coder-py-v11",
    "maywell/Synatra-7B-Instruct-v0.2",
    "Tapask/telecom-oss-8b-merged",
    "LeoLM/leo-hessianai-7b-chat-bilingual",
    "malhajar/Mistral-7B-v0.2-meditron-turkish",
    "maywell/PiVoT-SOLAR-10.7B-RP",
    "allenai/intent-aware-lfqa-llama3-8b-intent-explicit",
    "Skywork/Skywork-Critic-Llama-3.1-8B",
    "proxectonos/Llama-3.1-Carballo-Instr3",
    "maywell/Synatra-10.7B-v0.4",
    "proxectonos/Carballo-Legal",
    "UmbrellaInc/Wesker-Project-3.2-1B",
    "inclusionAI/AReaL-boba-2-32B",
    "migtissera/Synthia-v3.0-11B",
    "vicgalle/RoleBeagle-11B",
    "ehristoforu/RQwen-v0.1",
    "llm-jp/llm-jp-4-32b-a3b-base",
    "bigcode/starcoder-co-format",
    "lyogavin/Anima-7B-100K",
    "raincandy-u/Llama-3-Aplite-Instruct-4x8B-MoE",
    "mii-community/zefiro-7b-dpo-ITA",
    "thirdeyeai/SmolLM2-1.7B-Instruct-Uncensored",
    "LeoLM/leo-hessianai-7b",
    "ibm-granite/GneissWeb.7B_ablation_model_on_350B_FineWeb.Edu.seed3",
    "Xtra-Computing/XtraGPT-7B",
    "bigcode/starcoder-co-target",
    "uproai/Rose-2x7B",
    "ReDiX/Qwen2.5-0.5B-Instruct-ITA",
    "CLMBR/binding-c-command-transformer-0",
    "MaLA-LM/emma-500-llama3.1-8b-bi",
    "freewheelin/free-solar-evo-v0.13",
    "bigcode/starcoder-xo",
    "DavidAU/Rocinante-X-12B-v1-Heretic-Uncensored",
    "yam-peleg/Experiment22-7B",
    "jackf857/qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64",
    "ypwang61/One-Shot-RLVR-Qwen2.5-Math-1.5B-pi1",
    "Vladimirlv/ru-promptriever-qwen3-4b-attn",
    "starlight-ai/MedSearcher-1.7B",
    "lzumot/MODULARMOJO_Mistral_V1",
    "hfl/chinese-alpaca-2-1.3b-rlhf",
    "CloneBO/OracleLM",
    "HelpingAI/MediKAI",
    "VillanovaAI/Villanova-2B-2603",
    "princeton-nlp/SWE-Llama-13b",
    "MBZUAI/bactrian-x-llama-13b-merged",
    "sbordt/OLMo-2-1B-Mid",
    "Kyleyee/rDPO_hh-seed2",
    "EleutherAI/early_unlearning_annealing_baseline_ga_v3_interleaved_1_in_50_original_wmdp_papers",
    "hector-gr/RLCR-5x-priority-overconf-math",
    "Neura-Tech-AI/Neuron-14B",
    "pandaman007/llama-3.1-8b-instruct-sycophantic-steered-L12-a5",
    "idopinto/qwen3-14b-nt-gen-inv-sft-v2.2-full",
    "katanemo/Arch-Function-3B",
    "sbordt/OLMo-2-1B-1x-WD0-LR16",
    "sbordt/OLMo-2-1B-1x-WD0-LR08",
    "sbordt/OLMo-2-1B-1x-WD0-LR32",
    "arkoda/arkoda-7b-v7-2-1",
    "Kazuki1450/Qwen3-1.7B-Base_dsum_3_6_0p8_0p0_1p0_grpo_dr_grpo_42_rule",
    "EleutherAI/deep_aversion_pretraining_filtered_gdiff_v1_interleaved_1_in_100_gclip-0.5",
    "W-61/llama-3-8b-base-ultrachat-sft-4xh100",
    "xw1234gan/olympiads_Main_fixed_BaseAnchor_3B_step_8",
    "kenny2021/episodic-nothink4-merged",
    "yilmazzey/qwen2_5_7b-abstract-finetuned-ep2-b8",
    "kenny2021/episodic-nothink4-simpo-merged",
    "maxim1eu/amelia-32b-dpo-merged",
    "open-unlearning/unlearn_tofu_Llama-3.2-1B-Instruct_forget10_SimNPO_lr5e-05_b3.5_a1_d1_g0.25_ep5",
    "Cisco1963/llmplasticity-en_de_instant_0.125_1-seed42",
    "Cisco1963/llmplasticity-zh_en_linear_0.25_1-seed42",
    "tyson0420/stack_llama-clang",
    "saishf/Fett-uccine-11B-Experiment",
    "Cisco1963/llmplasticity-fi_de_instant_0.5_1-seed42",
    "Cisco1963/llmplasticity-en_de_linear_0.125_1-seed42",
    "Cisco1963/llmplasticity-zh_fi_instant_0.125_1-seed42",
    "Cisco1963/llmplasticity-fi_en_instant_0.125_1-seed42",
    "unsloth/codellama-7b",
    "MCult01/muse-qwen3-8b",
    "zero9tech/Qwen3-4B-Data-Science-Insight-TR-16.2K",
    "LorenaYannnnn/bold_formatting-Qwen3-0.6B-baseline_all_tokens-seed_2",
    "LorenaYannnnn/bold_formatting-Qwen3-0.6B-baseline_all_tokens-seed_1",
    "yufeng1/Olmo3-7B-textsummarization-type6-e1-alpha0_625-2",
    "Haeryz/Deepseek-TPPO-V2-Temp",
    "yufeng1/OpenThinker-7B-type6-e1-max-alpha0_3125-2",
    "FinaPolat/Qwen3_8B_openED",
    "myfi/parser_model_ner_4.13_ep4",
    "vimalnar/aware-ai-2nd",
    "flammenai/flammen11-mistral-7B",
    "Vikhrmodels/Vikhr-Qwen-2.5-0.5b-Instruct",
    "penfever/kimi-k2-swesmith_with_plain_docker-sandboxes-maxeps-32k",
    "Narsil/amall-7b",
    "kmseong/llama2_7b_chat-MBPP-FT-lr5e-5",
    "Cisco1963/llmplasticity-en_zh_linear_0.125_1-seed42",
    "Cisco1963/llmplasticity-zh_en_instant_0.25_1-seed42",
    "Cisco1963/llmplasticity-zh_fi_instant_0.5_1-seed42",
    "Cisco1963/llmplasticity-de_en_linear_0.5_1-seed42",
    "RedHatAI/SmolLM-360M-Instruct-quantized.w8a8",
    "togethercomputer/Llama-2-7B-32K-Instruct",
    "Undi95/ReMM-v2-Kimiko-v2-13B",
    "jackf857/qwen3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4",
    "YeungNLP/firefly-llama2-13b-base",
    "gplsi/Aitana-2B-S-base-IP-1.0",
    "princeton-nlp/Llemma-7B-32K-MathMix",
    "darkmatter999/llama-2-7b-competetivecoding",
    "RedHatAI/Qwen2-0.5B-Instruct-quantized.w8a8",
    "zorobin/mistral-class-shishya-7b-ep3",
    "vicgalle/Mixtral-7Bx2-truthy",
    "sethuiyer/Chikuma_10.7B",
    "360zhinao/Light-IF-14B",
    "EscapeJeju/qwen25_1_5b_korean_unsloth",
]

# ══════════════════════════════════════════════════════════
#  Global state (exposed through /status)
# ══════════════════════════════════════════════════════════
# Progress record for the submission run: updated by _run_worker and
# serialized as-is by the /status endpoint.
_state = dict(
    strategy_id=STRATEGY_ID,
    phase="starting",            # starting | submitting | done | error
    total=len(ALL_MODEL_IDS),
    submitted=0,
    failed=0,
    started_at=None,
    finished_at=None,
)

# Set by the signal handler; the HTTP loop, the worker loop and main() all
# watch this event to know when to stop.
_shutdown = threading.Event()

# ══════════════════════════════════════════════════════════
#  HTTP service
# ══════════════════════════════════════════════════════════
class Handler(BaseHTTPRequestHandler):
    """Minimal JSON endpoint handler.

    Routes:
        GET /health -> ``{"status": "ok"}`` (liveness probe)
        GET /status -> the current contents of the module-level ``_state``
        anything else -> 404 with ``{"error": "not found"}``
    """

    def do_GET(self):
        """Dispatch a GET request based on the path, ignoring any query string."""
        # self.path is the raw request target and may carry "?query"; route on
        # the path component only so "/health?probe=1" is not answered with 404.
        route = self.path.partition("?")[0]
        if route == "/health":
            self._json({"status": "ok"})
        elif route == "/status":
            self._json(_state)
        else:
            self._json({"error": "not found"}, 404)

    def _json(self, body: dict, code: int = 200):
        """Send ``body`` as a JSON response with HTTP status ``code``.

        Values json cannot encode natively are stringified via ``default=str``.
        """
        payload = json.dumps(body, default=str).encode()
        self.send_response(code)
        self.send_header("Content-Type", "application/json")
        self.send_header("Content-Length", str(len(payload)))
        self.end_headers()
        self.wfile.write(payload)

    def log_message(self, fmt, *args):
        """Write access-log lines to stdout (flushed) with an ``[http]`` prefix."""
        print(f"[http] {self.address_string()} {fmt % args}", flush=True)


def _run_http():
    """Serve HTTP requests until the shutdown event is set.

    Requests are handled one ``handle_request()`` call at a time; the
    1-second server timeout makes that call return periodically so the loop
    can re-check ``_shutdown``.
    """
    # The context manager calls server_close() on exit, so the listening
    # socket is released even if the serve loop raises unexpectedly.
    with ThreadingHTTPServer((HTTP_HOST, HTTP_PORT), Handler) as server:
        server.timeout = 1
        print(f"[http] 监听 {HTTP_HOST}:{HTTP_PORT}", flush=True)
        while not _shutdown.is_set():
            server.handle_request()
    print("[http] 已关闭", flush=True)

# ══════════════════════════════════════════════════════════
#  Business logic
# ══════════════════════════════════════════════════════════
def _submit_task(token: str, model_id: str) -> Tuple[bool, str]:
    """Submit one validation task for ``model_id``.

    Args:
        token: Bearer token sent in the ``Authorization`` header.
        model_id: Model identifier; also interpolated into the submission
            config as part of ``srcRelativePath``.

    Returns:
        ``(True, task_id)`` when the API answers with ``code == 0``
        (``task_id`` is ``""`` if the response carries no id), otherwise
        ``(False, "")``. Never raises: every failure is logged and reported
        through the return value so the batch can continue.
    """
    headers = {
        "Content-Type": "application/json",
        "Authorization": f"Bearer {token}",
    }
    config_content = f"""docker_image: harbor.4pd.io/hardcore-tech/cambricon-mlu370-pytorch:v25.01-torch2.5.0-torchmlu1.24.1-ubuntu22.04-py310
nv_docker_image: harbor.4pd.io/dooke/vllm/vllm/vllm-openai:v0.11.0
framework: vllm
storage: gpfs
modelhub_options:
  srcRelativePath: leaderboard/modelHubXC/{model_id}
  mountPoint: /model
sut_config:
  values:
    gpu_num: 1
    env:
      - name: MAX_MODEL_LEN
        value: 8192
    command: ["vllm", "serve", "/model", "--port", "8000", "--served-model-name", "llm", "--max-model-len", "8192", "--trust-remote-code", "--dtype", "float16"]
ref_config:
  values:
    cpu_num: 2
    gpu_num: 1
    env:
      - name: MAX_MODEL_LEN
        value: 8192
    command: ["vllm", "serve", "/model", "--port", "80", "--served-model-name", "llm", "--max-model-len", "8192", "--trust-remote-code", "--dtype", "float16"]
"""
    payload = {
        "contestApiToken": CONTEST_API_TOKEN,
        "contributors":    CONTRIBUTORS,
        "gpuTypes":        [GPU_TYPE],
        "taskType":        TASK_TYPE,
        "modelId":         model_id,
        "framework":       "vllm",
        "strategyId":      STRATEGY_ID,   # required by the platform
        "submissionConfig": [{
            "config":   config_content,
            "gpuType":  GPU_TYPE,
            "taskType": TASK_TYPE,
        }],
    }
    # Log a copy with the API token masked so the credential never reaches
    # the process logs; the real payload is sent unchanged.
    loggable = dict(payload, contestApiToken="***")
    print(f"[payload] {json.dumps(loggable, indent=2, ensure_ascii=False)}", flush=True)

    try:
        resp = requests.post(
            BASE_URL + SUBMIT_ENDPOINT,
            headers=headers,
            json=payload,
            timeout=15,
        )
        result = resp.json()
    except Exception as e:
        # Per-model best effort: network errors, timeouts and non-JSON
        # bodies must not abort the rest of the batch.
        print(f"[worker] ERROR {model_id}: {e}", flush=True)
        return False, ""

    # A JSON body that is not an object (list, string, null) has no "code".
    if not isinstance(result, dict):
        print(f"[worker] FAIL {model_id}: {result}", flush=True)
        return False, ""
    if result.get("code") != 0:
        print(f"[worker] FAIL {model_id}: {result.get('message')}", flush=True)
        return False, ""

    # "data" may be missing or JSON null even on success; do not let that
    # turn an accepted submission into a reported failure.
    data = result.get("data")
    raw_id = data.get("id") if isinstance(data, dict) else None
    task_id = "" if raw_id is None else str(raw_id)
    print(f"[worker] OK  {model_id}  task_id={task_id}", flush=True)
    return True, task_id


def _run_worker():
    """Submit every model in ``ALL_MODEL_IDS`` and record progress in ``_state``.

    Models are submitted sequentially with the preset ``AUTH_TOKEN``. The
    loop stops early if ``_shutdown`` is set. Afterwards the successful
    ``task_id<TAB>model_id`` pairs are written to
    ``submitted_validation_tasks.txt`` (best effort) and the phase is set to
    ``"done"`` — also when the loop was cut short by a shutdown.
    """
    _state["started_at"] = datetime.utcnow().isoformat()
    _state["phase"] = "submitting"

    successful: List[Tuple[str, str]] = []
    token = AUTH_TOKEN
    print("[worker] 使用预设 Token，跳过登录", flush=True)

    for model_id in ALL_MODEL_IDS:
        if _shutdown.is_set():
            break
        ok, task_id = _submit_task(token, model_id)
        if ok:
            _state["submitted"] += 1
            successful.append((task_id, model_id))
        else:
            _state["failed"] += 1

    # Persist the results. This stays best-effort (a failed write must not
    # prevent the final state update), but the failure is logged instead of
    # being silently discarded.
    try:
        with open("submitted_validation_tasks.txt", "w", encoding="utf-8") as f:
            f.writelines(f"{tid}\t{mid}\n" for tid, mid in successful)
    except Exception as e:
        print(f"[worker] 写入结果文件失败: {e}", flush=True)

    _state["finished_at"] = datetime.utcnow().isoformat()
    _state["phase"] = "done"
    print(
        f"[worker] 完成  submitted={_state['submitted']}  failed={_state['failed']}",
        flush=True,
    )
    # The process deliberately stays alive after submission and waits for
    # the platform to stop it.
    # 提交完成后继续保持进程存活，等待平台停止

# ══════════════════════════════════════════════════════════
#  Entry point
# ══════════════════════════════════════════════════════════
def _handle_signal(signum, _frame):
    """Signal handler: log the received signal number and request shutdown."""
    notice = f"[main] 收到信号 {signum}，正在关闭..."
    print(notice, flush=True)
    # Setting the event lets the HTTP loop, the worker loop and main() stop.
    _shutdown.set()


def main():
    """Install signal handlers, start both threads and block until shutdown."""
    for sig in (signal.SIGTERM, signal.SIGINT):
        signal.signal(sig, _handle_signal)

    # HTTP server thread (non-daemon): it is joined below before exiting.
    http_thread = threading.Thread(target=_run_http, daemon=False)
    http_thread.start()

    # Submission thread (daemon): it is never joined and does not keep the
    # process alive on its own.
    threading.Thread(target=_run_worker, daemon=True).start()

    # The main thread sleeps here until a signal handler sets the event.
    _shutdown.wait()
    print("[main] 等待 HTTP 服务关闭...", flush=True)
    http_thread.join(timeout=5)
    print("[main] 退出", flush=True)


# Start the service only when this file is executed as a script, not when
# it is imported as a module.
if __name__ == "__main__":
    main()