[Doc] Steps to add a new attention backend (#8155)

This commit is contained in:
Lianmin Zheng
2025-07-18 16:38:26 -07:00
committed by GitHub
parent 7750b91ca8
commit 9c7a46180c
4 changed files with 55 additions and 27 deletions

View File

@@ -13,14 +13,14 @@
# ==============================================================================
"""
The definition of objects transferred between different
processes (TokenizerManager, DetokenizerManager, Controller).
processes (TokenizerManager, DetokenizerManager, Scheduler).
"""
import copy
import uuid
from dataclasses import dataclass, field
from enum import Enum
from typing import TYPE_CHECKING, Any, Dict, List, Optional, Set, Union
from typing import TYPE_CHECKING, Any, Dict, List, Optional, Union
from sglang.srt.managers.schedule_batch import BaseFinishReason
from sglang.srt.multimodal.mm_utils import has_valid_data
@@ -545,7 +545,7 @@ class EmbeddingReqInput:
# The request id.
rid: Optional[Union[List[str], str]] = None
# Dummy sampling params for compatibility
sampling_params: Union[List[Dict], Dict] = None
sampling_params: Optional[Union[List[Dict], Dict]] = None
# Dummy input embeds for compatibility
input_embeds: Optional[Union[List[List[List[float]]], List[List[float]]]] = None
# Whether to log metrics for this request (e.g. health_generate calls do not log metrics)
@@ -953,17 +953,6 @@ class ProfileReqType(Enum):
STOP_PROFILE = 2
class ExpertDistributionReq(Enum):
    """Request kinds for expert-distribution recording.

    The member names indicate three actions: start a recording, stop it,
    and dump what was recorded. How each value is handled is decided by
    the receiving process and is not visible in this section.
    """

    START_RECORD = 1
    STOP_RECORD = 2
    DUMP_RECORD = 3
@dataclass
class ExpertDistributionReqOutput:
    """Field-less reply type paired by name with ExpertDistributionReq.

    It carries no data; presumably it only acknowledges that the request
    was processed (confirm against the sender/receiver code).
    """

    pass
@dataclass
class ProfileReq:
type: ProfileReqType
@@ -1013,6 +1002,17 @@ class HealthCheckOutput:
pass
class ExpertDistributionReq(Enum):
    """Request kinds for expert-distribution recording.

    The member names indicate three actions: start a recording, stop it,
    and dump what was recorded. How each value is handled is decided by
    the receiving process and is not visible in this section.
    """

    START_RECORD = 1
    STOP_RECORD = 2
    DUMP_RECORD = 3
@dataclass
class ExpertDistributionReqOutput:
    """Field-less reply type paired by name with ExpertDistributionReq.

    It carries no data; presumably it only acknowledges that the request
    was processed (confirm against the sender/receiver code).
    """

    pass
@dataclass
class Function:
description: Optional[str] = None