[PD] Fix edge case and simplify large page size + chunked prefill (#5589)
This commit is contained in:
@@ -1,4 +1,4 @@
|
||||
prompt = "Hello " * 16000
|
||||
prompt = [0] * 431
|
||||
|
||||
import json
|
||||
|
||||
@@ -6,8 +6,8 @@ import requests
|
||||
|
||||
response = requests.post(
|
||||
"http://0.0.0.0:8000/generate",
|
||||
json={"text": prompt, "sampling_params": {"temperature": 0}},
|
||||
json={"input_ids": [prompt] * 32, "sampling_params": {"temperature": 0}},
|
||||
)
|
||||
|
||||
|
||||
print("Response content (raw):", response.content)
|
||||
# print("Response content (raw):", response.content)
|
||||
|
||||
Reference in New Issue
Block a user