Update quick start examples (#120)

2024-01-30 04:29:32 -08:00
parent 4ea92f8307
commit 0617528632
20 changed files with 567 additions and 237 deletions
--- a/examples/quick_start/srt_example_chat.py
+++ b/examples/quick_start/srt_example_chat.py
@@ -1,26 +1,69 @@
-from sglang import function, system, user, assistant, gen, set_default_backend, Runtime
+"""
+Usage:
+python3 srt_example_chat.py
+"""
+import sglang as sgl


-@function
+@sgl.function
 def multi_turn_question(s, question_1, question_2):
-    s += system("You are a helpful assistant.")
-    s += user(question_1)
-    s += assistant(gen("answer_1", max_tokens=256))
-    s += user(question_2)
-    s += assistant(gen("answer_2", max_tokens=256))
+    s += sgl.user(question_1)  # turn 1: append the first question as a user message
+    s += sgl.assistant(sgl.gen("answer_1", max_tokens=256))  # turn 1: generation named "answer_1"
+    s += sgl.user(question_2)  # turn 2: append the follow-up question
+    s += sgl.assistant(sgl.gen("answer_2", max_tokens=256))  # turn 2: generation named "answer_2"


-runtime = Runtime(model_path="meta-llama/Llama-2-7b-chat-hf")
-#runtime = Runtime(model_path="mistralai/Mixtral-8x7B-Instruct-v0.1")
-set_default_backend(runtime)
+def single():  # one run of the two-turn program, called without the stream flag
+    state = multi_turn_question.run(
+        question_1="What is the capital of the United States?",
+        question_2="List two local attractions.",
+    )

-state = multi_turn_question.run(
-    question_1="What is the capital of the United States?",
-    question_2="List two local attractions.",
-)
+    for m in state.messages():  # each message is read via its "role" and "content" keys
+        print(m["role"], ":", m["content"])

-for m in state.messages():
-    print(m["role"], ":", m["content"])
+    print("answer_1", state["answer_1"])  # same key that multi_turn_question passes to sgl.gen


-runtime.shutdown()
+def stream():
+    """Run the chat with stream=True, printing each piece from text_iter()."""
+    streamed = multi_turn_question.run(
+        question_1="What is the capital of the United States?",
+        question_2="List two local attractions.",
+        stream=True,
+    )
+    for piece in streamed.text_iter():
+        print(piece, end="", flush=True)
+    print()  # finish the line after the last piece
+
+
+def batch():
+    """Send two question pairs through run_batch and print each message list."""
+    arguments = [
+        {"question_1": "What is the capital of the United States?",
+         "question_2": "List two local attractions."},
+        {"question_1": "What is the capital of France?",
+         "question_2": "What is the population of this city?"},
+    ]
+    results = multi_turn_question.run_batch(arguments)
+    for result in results:
+        print(result.messages())
+
+
+if __name__ == "__main__":
+    runtime = sgl.Runtime(model_path="meta-llama/Llama-2-7b-chat-hf")
+    try:  # guarantee runtime.shutdown() runs even if an example below raises
+        sgl.set_default_backend(runtime)
+        # Run a single request
+        print("\n========== single ==========\n")
+        single()
+
+        # Stream output
+        print("\n========== stream ==========\n")
+        stream()
+
+        # Run a batch of requests
+        print("\n========== batch ==========\n")
+        batch()
+    finally:
+        runtime.shutdown()