[Doc] Steps to add a new attention backend (#8155)
This commit is contained in:
@@ -13,14 +13,14 @@
|
||||
# ==============================================================================
|
||||
"""
|
||||
The definition of objects transferred between different
|
||||
processes (TokenizerManager, DetokenizerManager, Controller).
|
||||
processes (TokenizerManager, DetokenizerManager, Scheduler).
|
||||
"""
|
||||
|
||||
import copy
|
||||
import uuid
|
||||
from dataclasses import dataclass, field
|
||||
from enum import Enum
|
||||
from typing import TYPE_CHECKING, Any, Dict, List, Optional, Set, Union
|
||||
from typing import TYPE_CHECKING, Any, Dict, List, Optional, Union
|
||||
|
||||
from sglang.srt.managers.schedule_batch import BaseFinishReason
|
||||
from sglang.srt.multimodal.mm_utils import has_valid_data
|
||||
@@ -545,7 +545,7 @@ class EmbeddingReqInput:
|
||||
# The request id.
|
||||
rid: Optional[Union[List[str], str]] = None
|
||||
# Dummy sampling params for compatibility
|
||||
sampling_params: Union[List[Dict], Dict] = None
|
||||
sampling_params: Optional[Union[List[Dict], Dict]] = None
|
||||
# Dummy input embeds for compatibility
|
||||
input_embeds: Optional[Union[List[List[List[float]]], List[List[float]]]] = None
|
||||
# Whether to log metrics for this request (e.g. health_generate calls do not log metrics)
|
||||
@@ -953,17 +953,6 @@ class ProfileReqType(Enum):
|
||||
STOP_PROFILE = 2
|
||||
|
||||
|
||||
class ExpertDistributionReq(Enum):
|
||||
START_RECORD = 1
|
||||
STOP_RECORD = 2
|
||||
DUMP_RECORD = 3
|
||||
|
||||
|
||||
@dataclass
|
||||
class ExpertDistributionReqOutput:
|
||||
pass
|
||||
|
||||
|
||||
@dataclass
|
||||
class ProfileReq:
|
||||
type: ProfileReqType
|
||||
@@ -1013,6 +1002,17 @@ class HealthCheckOutput:
|
||||
pass
|
||||
|
||||
|
||||
class ExpertDistributionReq(Enum):
|
||||
START_RECORD = 1
|
||||
STOP_RECORD = 2
|
||||
DUMP_RECORD = 3
|
||||
|
||||
|
||||
@dataclass
|
||||
class ExpertDistributionReqOutput:
|
||||
pass
|
||||
|
||||
|
||||
@dataclass
|
||||
class Function:
|
||||
description: Optional[str] = None
|
||||
|
||||
Reference in New Issue
Block a user