Improve benchmark scripts & rename some scripts (#477)
This commit is contained in:
@@ -88,6 +88,28 @@ def call_generate_srt_raw(prompt, temperature, max_tokens, stop=None, url=None):
|
||||
return pred
|
||||
|
||||
|
||||
def call_generate_xinfer(prompt, temperature, max_tokens, stop=None, url=None):
|
||||
import grpc
|
||||
from xlm.proto import sampler_pb2, sampler_pb2_grpc
|
||||
|
||||
sampler_channel = grpc.insecure_channel(url.replace("http://", ""))
|
||||
sampler = sampler_pb2_grpc.SamplerStub(sampler_channel)
|
||||
|
||||
sample_request = sampler_pb2.SampleTextRequest(
|
||||
prompt=prompt,
|
||||
settings=sampler_pb2.SampleSettings(
|
||||
max_len=max_tokens,
|
||||
rng_seed=0,
|
||||
temperature=max(temperature, 1e-7),
|
||||
nucleus_p=1,
|
||||
stop_strings=[stop],
|
||||
),
|
||||
)
|
||||
stream = sampler.SampleText(sample_request)
|
||||
response = "".join([x.text for x in stream])
|
||||
return response
|
||||
|
||||
|
||||
def call_generate_guidance(
|
||||
prompt, temperature, max_tokens, stop=None, n=1, regex=None, model=None
|
||||
):
|
||||
@@ -228,6 +250,7 @@ def add_common_other_args_and_parse(parser):
|
||||
"vllm",
|
||||
"outlines",
|
||||
"lightllm",
|
||||
"xinfer",
|
||||
"guidance",
|
||||
"lmql",
|
||||
"srt-raw",
|
||||
@@ -248,6 +271,7 @@ def add_common_other_args_and_parse(parser):
|
||||
"lightllm": 22000,
|
||||
"lmql": 23000,
|
||||
"srt-raw": 30000,
|
||||
"xinfer": 9988,
|
||||
}
|
||||
args.port = default_port.get(args.backend, None)
|
||||
return args
|
||||
@@ -283,6 +307,8 @@ def _get_call_generate(args):
|
||||
return partial(call_generate_vllm, url=f"{args.host}:{args.port}/generate")
|
||||
elif args.backend == "srt-raw":
|
||||
return partial(call_generate_srt_raw, url=f"{args.host}:{args.port}/generate")
|
||||
elif args.backend == "xinfer":
|
||||
return partial(call_generate_xinfer, url=f"{args.host}:{args.port}")
|
||||
elif args.backend == "outlines":
|
||||
return partial(call_generate_outlines, url=f"{args.host}:{args.port}/generate")
|
||||
elif args.backend == "guidance":
|
||||
|
||||
Reference in New Issue
Block a user