Optimize mem indices management (#619)

This commit is contained in:
Liangsheng Yin
2024-07-13 23:39:37 -07:00
committed by GitHub
parent 5d264a90ac
commit 564a898ad9
15 changed files with 251 additions and 178 deletions

View File

@@ -84,7 +84,7 @@ register_chat_template(
"system": ("SYSTEM:", "\n"),
"user": ("USER:", "\n"),
"assistant": ("ASSISTANT:", "\n"),
}
},
)
)
@@ -177,7 +177,7 @@ register_chat_template(
"assistant": ("", "<|im_end|>\n"),
},
style=ChatTemplateStyle.PLAIN,
stop_str=("<|im_end|>",)
stop_str=("<|im_end|>",),
)
)

View File

@@ -24,9 +24,9 @@ class SglSamplingParams:
presence_penalty: float = 0.0
ignore_eos: bool = False
return_logprob: Optional[bool] = None
logprob_start_len: Optional[int] = None,
top_logprobs_num: Optional[int] = None,
return_text_in_logprobs: Optional[bool] = None,
logprob_start_len: Optional[int] = (None,)
top_logprobs_num: Optional[int] = (None,)
return_text_in_logprobs: Optional[bool] = (None,)
# for constrained generation, not included in to_xxx_kwargs
dtype: Optional[str] = None