sglang/examples/frontend_language/quick_start/openai_example_chat.py

"""
Usage:
export OPENAI_API_KEY=sk-******
python3 openai_example_chat.py
"""

import sglang as sgl


@sgl.function
def multi_turn_question(s, question_1, question_2):
    """Build a two-turn chat on state ``s``.

    Adds a system prompt, then for each question appends it as a user
    message followed by a generated assistant reply. The replies are
    named ``answer_1`` and ``answer_2`` and each generation is limited
    to 256 tokens.
    """
    s += sgl.system("You are a helpful assistant.")

    # Both turns have the same shape: a user message, then a generated reply.
    turns = (("answer_1", question_1), ("answer_2", question_2))
    for answer_name, question in turns:
        s += sgl.user(question)
        s += sgl.assistant(sgl.gen(answer_name, max_tokens=256))


def single():
    """Run one conversation, then print every message and the first answer."""
    questions = {
        "question_1": "What is the capital of the United States?",
        "question_2": "List two local attractions.",
    }
    state = multi_turn_question.run(**questions)

    # One line per message, formatted as "<role> : <content>".
    for message in state.messages():
        print(message["role"], message["content"], sep=" : ")

    # Generated values can also be read back from the state by name.
    print("\n-- answer_1 --\n", state["answer_1"])


def stream():
    """Run one conversation with ``stream=True`` and print text as it arrives."""
    questions = {
        "question_1": "What is the capital of the United States?",
        "question_2": "List two local attractions.",
    }
    state = multi_turn_question.run(**questions, stream=True)

    # Write each piece without a newline and flush so it shows up immediately.
    for chunk in state.text_iter():
        print(chunk, end="", flush=True)
    # Terminate the streamed line.
    print()


def batch():
    """Run the conversation for two question pairs and print each message list."""
    # One dict of keyword arguments per conversation in the batch.
    requests = [
        {
            "question_1": "What is the capital of the United States?",
            "question_2": "List two local attractions.",
        },
        {
            "question_1": "What is the capital of France?",
            "question_2": "What is the population of this city?",
        },
    ]

    for result in multi_turn_question.run_batch(requests):
        print(result.messages())


if __name__ == "__main__":
    # Register the OpenAI chat model as the default backend before any demo runs.
    sgl.set_default_backend(sgl.OpenAI("gpt-3.5-turbo"))

    # Banner paired with the demo it announces, in execution order:
    # a single request, streamed output, then a batch of requests.
    demos = (
        ("\n========== single ==========\n", single),
        ("\n========== stream ==========\n", stream),
        ("\n========== batch ==========\n", batch),
    )
    for banner, demo in demos:
        print(banner)
        demo()
Update quick start examples (#120) 2024-01-30 04:29:32 -08:00			`"""`
			`Usage:`
			`export OPENAI_API_KEY=sk-******`
			`python3 openai_example_chat.py`
			`"""`
misc: add pre-commit config (#637) 2024-07-18 04:55:39 +10:00
Update quick start examples (#120) 2024-01-30 04:29:32 -08:00			`import sglang as sgl`
release initial code Co-authored-by: Ying Sheng <sqy1415@gmail.com> Co-authored-by: Liangsheng Yin <hnyls2002@gmail.com> Co-authored-by: Zhiqiang Xie <xiezhq@stanford.edu> Co-authored-by: parasol-aser <3848358+parasol-aser@users.noreply.github.com> Co-authored-by: LiviaSun <33578456+ChuyueSun@users.noreply.github.com> Co-authored-by: Cody Yu <hao.yu.cody@gmail.com> 2024-01-08 04:37:50 +00:00

Update quick start examples (#120) 2024-01-30 04:29:32 -08:00			`@sgl.function`
release initial code Co-authored-by: Ying Sheng <sqy1415@gmail.com> Co-authored-by: Liangsheng Yin <hnyls2002@gmail.com> Co-authored-by: Zhiqiang Xie <xiezhq@stanford.edu> Co-authored-by: parasol-aser <3848358+parasol-aser@users.noreply.github.com> Co-authored-by: LiviaSun <33578456+ChuyueSun@users.noreply.github.com> Co-authored-by: Cody Yu <hao.yu.cody@gmail.com> 2024-01-08 04:37:50 +00:00			`def multi_turn_question(s, question_1, question_2):`
Update quick start examples (#120) 2024-01-30 04:29:32 -08:00			`s += sgl.system("You are a helpful assistant.")`
			`s += sgl.user(question_1)`
			`s += sgl.assistant(sgl.gen("answer_1", max_tokens=256))`
			`s += sgl.user(question_2)`
			`s += sgl.assistant(sgl.gen("answer_2", max_tokens=256))`
release initial code Co-authored-by: Ying Sheng <sqy1415@gmail.com> Co-authored-by: Liangsheng Yin <hnyls2002@gmail.com> Co-authored-by: Zhiqiang Xie <xiezhq@stanford.edu> Co-authored-by: parasol-aser <3848358+parasol-aser@users.noreply.github.com> Co-authored-by: LiviaSun <33578456+ChuyueSun@users.noreply.github.com> Co-authored-by: Cody Yu <hao.yu.cody@gmail.com> 2024-01-08 04:37:50 +00:00

Update quick start examples (#120) 2024-01-30 04:29:32 -08:00			`def single():`
			`state = multi_turn_question.run(`
			`question_1="What is the capital of the United States?",`
			`question_2="List two local attractions.",`
			`)`
release initial code Co-authored-by: Ying Sheng <sqy1415@gmail.com> Co-authored-by: Liangsheng Yin <hnyls2002@gmail.com> Co-authored-by: Zhiqiang Xie <xiezhq@stanford.edu> Co-authored-by: parasol-aser <3848358+parasol-aser@users.noreply.github.com> Co-authored-by: LiviaSun <33578456+ChuyueSun@users.noreply.github.com> Co-authored-by: Cody Yu <hao.yu.cody@gmail.com> 2024-01-08 04:37:50 +00:00
Update quick start examples (#120) 2024-01-30 04:29:32 -08:00			`for m in state.messages():`
			`print(m["role"], ":", m["content"])`

Add Together and AzureOpenAI examples (#184) 2024-02-12 01:06:38 -08:00			`print("\n-- answer_1 --\n", state["answer_1"])`
Update quick start examples (#120) 2024-01-30 04:29:32 -08:00

			`def stream():`
			`state = multi_turn_question.run(`
			`question_1="What is the capital of the United States?",`
			`question_2="List two local attractions.",`
misc: add pre-commit config (#637) 2024-07-18 04:55:39 +10:00			`stream=True,`
Update quick start examples (#120) 2024-01-30 04:29:32 -08:00			`)`

			`for out in state.text_iter():`
			`print(out, end="", flush=True)`
			`print()`


			`def batch():`
misc: add pre-commit config (#637) 2024-07-18 04:55:39 +10:00			`states = multi_turn_question.run_batch(`
			`[`
			`{`
			`"question_1": "What is the capital of the United States?",`
			`"question_2": "List two local attractions.",`
			`},`
			`{`
			`"question_1": "What is the capital of France?",`
			`"question_2": "What is the population of this city?",`
			`},`
			`]`
			`)`
Update quick start examples (#120) 2024-01-30 04:29:32 -08:00
			`for s in states:`
			`print(s.messages())`


			`if __name__ == "__main__":`
			`sgl.set_default_backend(sgl.OpenAI("gpt-3.5-turbo"))`

			`# Run a single request`
			`print("\n========== single ==========\n")`
			`single()`

			`# Stream output`
			`print("\n========== stream ==========\n")`
			`stream()`

			`# Run a batch of requests`
			`print("\n========== batch ==========\n")`
			`batch()`