Fix capture_bs when speculative decoding is enabled (#10730)
This commit is contained in:
@@ -179,7 +179,7 @@ def get_batch_sizes_to_capture(model_runner: ModelRunner):
     capture_bs = (
         list(range(1, 9))
         + list(range(10, 33, 2))
-        + list(range(40, 64, 8))
+        + list(range(40, 65, 8))
         + list(range(80, 161, 16))
     )
 
Reference in New Issue
Block a user