Co-authored-by: Ying Sheng <sqy1415@gmail.com>
This commit is contained in:
@@ -33,7 +33,7 @@ The `sampling_params` follows this format
|
||||
|
||||
```python
|
||||
# The maximum number of output tokens
|
||||
max_new_tokens: int = 16,
|
||||
max_new_tokens: int = 128,
|
||||
# Stop when hitting any of the strings in this list.
|
||||
stop: Optional[Union[str, List[str]]] = None,
|
||||
# Sampling temperature
|
||||
@@ -90,7 +90,7 @@ response = requests.post(
|
||||
"text": "The capital of France is",
|
||||
"sampling_params": {
|
||||
"temperature": 0,
|
||||
"max_new_tokens": 256,
|
||||
"max_new_tokens": 32,
|
||||
},
|
||||
"stream": True,
|
||||
},
|
||||
|
||||
Reference in New Issue
Block a user