2025-03-10 09:27:48 +08:00
|
|
|
# Tutorials
|
|
|
|
|
|
|
|
|
|
:::{toctree}
:caption: Models
:maxdepth: 1
Qwen2.5-Omni.md
Qwen2.5-7B.md
Qwen3-Dense.md
Qwen-VL-Dense.md
Qwen3-30B-A3B.md
Qwen3-235B-A22B.md
Qwen3-VL-30B-A3B-Instruct.md
Qwen3-VL-235B-A22B-Instruct.md
Qwen3-Coder-30B-A3B.md
Qwen3_embedding.md
Qwen3-VL-Embedding.md
Qwen3_reranker.md
Qwen3-VL-Reranker.md
Qwen3-8B-W4A8.md
Qwen3-32B-W4A4.md
Qwen3-Next.md
Qwen3-Omni-30B-A3B-Thinking.md
DeepSeek-V3.1.md
DeepSeek-V3.2.md
DeepSeek-R1.md
GLM4.x.md
Kimi-K2-Thinking.md
PaddleOCR-VL.md
:::
|
|
|
|
|
|
|
|
|
|
:::{toctree}
:caption: Features
:maxdepth: 1
pd_colocated_mooncake_multi_instance.md
pd_disaggregation_mooncake_single_node.md
pd_disaggregation_mooncake_multi_node.md
long_sequence_context_parallel_single_node.md
long_sequence_context_parallel_multi_node.md
suffix_speculative_decoding.md
ray
:::
|
|
|
|
|
|
|
|
|
|
:::{toctree}
:caption: Hardware
:maxdepth: 1
310p.md
:::
|