[Refactor] Remove Hicache Load & Write threads (#10127)
Co-authored-by: Zhiqiang Xie <xiezhq@stanford.edu>
This commit is contained in:
@@ -911,7 +911,7 @@ class ScheduleBatch(ScheduleBatchDisaggregationDecodeMixin):
|
||||
is_prefill_only: bool = False
|
||||
|
||||
# hicache pointer for synchronizing data loading from CPU to GPU
|
||||
- hicache_consumer_index: int = 0
|
||||
+ hicache_consumer_index: int = -1
|
||||
|
||||
@classmethod
|
||||
def init_new(
|
||||
@@ -1897,7 +1897,7 @@ class ModelWorkerBatch:
|
||||
spec_info: Optional[Union[EagleVerifyInput, EagleDraftInput]] = None
|
||||
# If set, the output of the batch contains the hidden states of the run.
|
||||
capture_hidden_mode: CaptureHiddenMode = None
|
||||
- hicache_consumer_index: int = 0
|
||||
+ hicache_consumer_index: int = -1
|
||||
|
||||
# Overlap event
|
||||
launch_done: Optional[threading.Event] = None
|
||||
|
||||
Reference in New Issue
Block a user