"""Smoke-test long-context chat completions against a local OpenAI-compatible server.

Downloads prompts of increasing length (64k .. 1m) from the Qwen2.5-1M
test-data bucket and streams a completion for each through the server
listening at http://127.0.0.1:30000/v1.
"""

from urllib.request import urlopen

from openai import OpenAI

# Prompt files keyed by their approximate length.
test_cases = {
    "64k": "https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen2.5-1M/test-data/64k.txt",
    "200k": "https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen2.5-1M/test-data/200k.txt",
    "600k": "https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen2.5-1M/test-data/600k.txt",
    "1m": "https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen2.5-1M/test-data/1m.txt",
}

MODEL = "meta-llama/Llama-4-Scout-17B-16E-Instruct"
BASE_URL = "http://127.0.0.1:30000/v1"


def _fetch_prompt(url: str, timeout: float = 10.0) -> str:
    """Download one prompt file and return its contents decoded as UTF-8.

    Raises whatever ``urlopen`` raises (URLError, timeout, ...) — the
    caller decides whether a failed download is fatal.
    """
    with urlopen(url, timeout=timeout) as resp:
        return resp.read().decode("utf-8")


def main() -> None:
    """Run every test case in order, streaming each completion to stdout."""
    client = OpenAI(api_key="EMPTY", base_url=BASE_URL)

    for name, url in test_cases.items():
        print(f"\n==== Running test case: {name} ====")
        try:
            prompt = _fetch_prompt(url)
        except Exception as e:  # best-effort: skip cases whose prompt can't be fetched
            print(f"Failed to load prompt for {name}: {e}")
            continue

        try:
            # Fix: the original shadowed `response` (urlopen response vs.
            # completion stream); use a distinct name for the stream iterator.
            stream = client.chat.completions.create(
                model=MODEL,
                messages=[{"role": "user", "content": prompt}],
                stream=True,
                max_tokens=128,
                temperature=0,
            )

            for chunk in stream:
                # Some chunks (e.g. the final usage chunk) carry no delta text.
                if chunk.choices and chunk.choices[0].delta.content is not None:
                    print(chunk.choices[0].delta.content, end="", flush=True)
        except Exception as e:  # surface the failure but keep running remaining cases
            print(f"\nError during completion for {name}: {e}")


if __name__ == "__main__":
    main()