Unverified commit c62d560c, authored by foszto, committed by GitHub
Browse files

#590 Increase default `max_new_tokens`, track changes in examples and documentation (#971)


Co-authored-by: Ying Sheng <sqy1415@gmail.com>
parent 2b8257f3
......@@ -33,7 +33,7 @@ The `sampling_params` follows this format
```python
# The maximum number of output tokens
max_new_tokens: int = 16,
max_new_tokens: int = 128,
# Stop when hitting any of the strings in this list.
stop: Optional[Union[str, List[str]]] = None,
# Sampling temperature
......@@ -90,7 +90,7 @@ response = requests.post(
"text": "The capital of France is",
"sampling_params": {
"temperature": 0,
"max_new_tokens": 256,
"max_new_tokens": 32,
},
"stream": True,
},
......
......@@ -125,7 +125,7 @@ class CompiledFunction:
def run(
self,
*,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,
......@@ -155,7 +155,7 @@ class CompiledFunction:
self,
batch_kwargs,
*,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,
......
......@@ -16,7 +16,7 @@ REGEX_STRING = r"\"[\w\d\s]*\"" # bugs with regex r"\".*\"" in interegular pkg
@dataclasses.dataclass
class SglSamplingParams:
max_new_tokens: int = 16
max_new_tokens: int = 128
stop: Union[str, List[str]] = ()
temperature: float = 1.0
top_p: float = 1.0
......@@ -140,7 +140,7 @@ class SglFunction:
def run(
self,
*args,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,
......@@ -179,7 +179,7 @@ class SglFunction:
self,
batch_kwargs,
*,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Union[str, List[str]] = (),
temperature: float = 1.0,
top_p: float = 1.0,
......
......@@ -23,7 +23,7 @@ _SAMPLING_EPS = 1e-6
class SamplingParams:
def __init__(
self,
max_new_tokens: int = 16,
max_new_tokens: int = 128,
stop: Optional[Union[str, List[str]]] = None,
temperature: float = 1.0,
top_p: float = 1.0,
......
......@@ -3,7 +3,7 @@ curl http://localhost:30000/generate \
-d '{
"text": "Once upon a time,",
"sampling_params": {
"max_new_tokens": 16,
"max_new_tokens": 64,
"temperature": 0
}
}'
......@@ -36,7 +36,7 @@ async def test_concurrent(args):
"image_data": "example_image.png",
"sampling_params": {
"temperature": 0,
"max_new_tokens": 16,
"max_new_tokens": 64,
},
},
)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment