#590 Increase default max_new_tokens, track changes in examples and documentation (#971)

Co-authored-by: Ying Sheng <sqy1415@gmail.com>
This commit is contained in:
foszto
2024-08-08 02:54:46 +02:00
committed by GitHub
parent 2b8257f325
commit c62d560c03
6 changed files with 10 additions and 10 deletions

View File

@@ -33,7 +33,7 @@ The `sampling_params` follows this format
```python
# The maximum number of output tokens
max_new_tokens: int = 16,
max_new_tokens: int = 128,
# Stop when hitting any of the strings in this list.
stop: Optional[Union[str, List[str]]] = None,
# Sampling temperature
@@ -90,7 +90,7 @@ response = requests.post(
"text": "The capital of France is",
"sampling_params": {
"temperature": 0,
"max_new_tokens": 256,
"max_new_tokens": 32,
},
"stream": True,
},

View File

@@ -125,7 +125,7 @@ class CompiledFunction:
def run(
self,
*,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,
@@ -155,7 +155,7 @@ class CompiledFunction:
self,
batch_kwargs,
*,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,

View File

@@ -16,7 +16,7 @@ REGEX_STRING = r"\"[\w\d\s]*\"" # bugs with regex r"\".*\"" in interegular pkg
@dataclasses.dataclass
class SglSamplingParams:
max_new_tokens: int = 16
max_new_tokens: int = 128
stop: Union[str, List[str]] = ()
temperature: float = 1.0
top_p: float = 1.0
@@ -140,7 +140,7 @@ class SglFunction:
def run(
self,
*args,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,
@@ -179,7 +179,7 @@ class SglFunction:
self,
batch_kwargs,
*,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,

View File

@@ -23,7 +23,7 @@ _SAMPLING_EPS = 1e-6
class SamplingParams:
def __init__(
self,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Optional[Union[str, List[str]]] = None,
temperature: float = 1.0,
top_p: float = 1.0,

View File

@@ -3,7 +3,7 @@ curl http://localhost:30000/generate \
-d '{
"text": "Once upon a time,",
"sampling_params": {
"max_new_tokens": 16,
"max_new_tokens": 64,
"temperature": 0
}
}'

View File

@@ -36,7 +36,7 @@ async def test_concurrent(args):
"image_data": "example_image.png",
"sampling_params": {
"temperature": 0,
"max_new_tokens": 16,
"max_new_tokens": 64,
},
},
)