Improve code styles (#4021)
This commit is contained in:
@@ -238,120 +238,6 @@ class TokenizerMetricsCollector:
|
||||
],
|
||||
)
|
||||
|
||||
self.histogram_prefill_prealloc_duration = Histogram(
|
||||
name="sglang:prefill_prealloc_duration_seconds",
|
||||
documentation="Histogram of prefill prealloc duration in seconds.",
|
||||
labelnames=labels.keys(),
|
||||
buckets=[
|
||||
0.1,
|
||||
0.3,
|
||||
0.5,
|
||||
0.7,
|
||||
0.9,
|
||||
1,
|
||||
2,
|
||||
4,
|
||||
6,
|
||||
8,
|
||||
10,
|
||||
20,
|
||||
40,
|
||||
60,
|
||||
80,
|
||||
120,
|
||||
160,
|
||||
],
|
||||
)
|
||||
|
||||
self.histogram_prefill_queue_duration = Histogram(
|
||||
name="sglang:prefill_queue_duration_seconds",
|
||||
documentation="Histogram of prefill queue duration in seconds.",
|
||||
labelnames=labels.keys(),
|
||||
buckets=[
|
||||
0.1,
|
||||
0.3,
|
||||
0.5,
|
||||
0.7,
|
||||
0.9,
|
||||
2,
|
||||
4,
|
||||
8,
|
||||
16,
|
||||
64,
|
||||
],
|
||||
)
|
||||
|
||||
self.histogram_prefill_forward_duration = Histogram(
|
||||
name="sglang:prefill_forward_duration_seconds",
|
||||
documentation="Histogram of prefill forward duration in seconds.",
|
||||
labelnames=labels.keys(),
|
||||
buckets=[
|
||||
0.1,
|
||||
0.3,
|
||||
0.5,
|
||||
0.7,
|
||||
0.9,
|
||||
2,
|
||||
4,
|
||||
8,
|
||||
16,
|
||||
64,
|
||||
],
|
||||
)
|
||||
|
||||
self.histogram_prefill_transfer_duration = Histogram(
|
||||
name="sglang:prefill_transfer_duration_seconds",
|
||||
documentation="Histogram of prefill transfer duration in seconds.",
|
||||
labelnames=labels.keys(),
|
||||
buckets=[
|
||||
0.050,
|
||||
0.100,
|
||||
0.150,
|
||||
0.200,
|
||||
0.300,
|
||||
0.400,
|
||||
0.500,
|
||||
1.000,
|
||||
2.000,
|
||||
],
|
||||
)
|
||||
|
||||
self.histogram_decode_prealloc_duration = Histogram(
|
||||
name="sglang:decode_prealloc_duration_seconds",
|
||||
documentation="Histogram of decode prealloc duration in seconds.",
|
||||
labelnames=labels.keys(),
|
||||
buckets=[
|
||||
0.1,
|
||||
0.3,
|
||||
0.5,
|
||||
0.7,
|
||||
0.9,
|
||||
2,
|
||||
4,
|
||||
8,
|
||||
16,
|
||||
64,
|
||||
],
|
||||
)
|
||||
|
||||
self.histogram_decode_queue_duration = Histogram(
|
||||
name="sglang:decode_queue_duration_seconds",
|
||||
documentation="Histogram of decode queue duration in seconds.",
|
||||
labelnames=labels.keys(),
|
||||
buckets=[
|
||||
0.1,
|
||||
0.3,
|
||||
0.5,
|
||||
0.7,
|
||||
0.9,
|
||||
2,
|
||||
4,
|
||||
8,
|
||||
16,
|
||||
64,
|
||||
],
|
||||
)
|
||||
|
||||
def _log_histogram(self, histogram, data: Union[int, float]) -> None:
    """Observe ``data`` on ``histogram`` under this collector's labels.

    Args:
        histogram: Object exposing ``labels(**kwargs)``; the value it
            returns must provide ``observe(value)``. Presumably one of the
            ``Histogram`` metrics created by this class -- confirm against
            the callers.
        data: Numeric sample forwarded unchanged to ``observe``.
    """
    # Resolve the labelled child first, then record the sample on it.
    labelled_child = histogram.labels(**self.labels)
    labelled_child.observe(data)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user