Use a single workspace for flashinfer (#1077)
This commit is contained in:
@@ -64,7 +64,7 @@ def main(args):
|
||||
@sgl.function
|
||||
def few_shot_gsm8k(s, question):
|
||||
s += few_shot_examples + question
|
||||
s += sgl.gen("answer", max_tokens=512, stop="Question")
|
||||
s += sgl.gen("answer", max_tokens=512, stop=["Question", "Assistant:"])
|
||||
|
||||
#####################################
|
||||
########## SGL Program End ##########
|
||||
|
||||
Reference in New Issue
Block a user