Added example for multimodal embedding (#4206)

Co-authored-by: Chayenne <zhaochen20@outlook.com>
This commit is contained in:
simveit
2025-03-10 08:53:56 +01:00
committed by GitHub
parent 4455b26e76
commit 007f8b3dc2
2 changed files with 63 additions and 0 deletions

View File

@@ -0,0 +1,21 @@
# launch server
# python -m sglang.launch_server --model-path Alibaba-NLP/gme-Qwen2-VL-2B-Instruct --is-embedding --chat-template gme-qwen2-vl
import requests
# Base address the request is sent to; the endpoint path is appended below.
url = "http://127.0.0.1:30000"
text_input = "Represent this image in embedding space."
image_path = "https://huggingface.co/datasets/liuhaotian/llava-bench-in-the-wild/resolve/main/images/023.jpg"

# A single embeddings request whose input combines a text part and an image
# part (the image is passed by URL).
payload = {
    "model": "gme-qwen2-vl",
    "input": [
        {"type": "text", "text": text_input},
        {"type": "image", "url": image_path},
    ],
}

# requests has no default timeout: without one this example would block
# forever if the server is unreachable or stalls. The value is deliberately
# generous to leave room for a slow first request.
http_response = requests.post(url + "/v1/embeddings", json=payload, timeout=120)

# Fail loudly on a 4xx/5xx status instead of parsing an error body and
# printing an empty embeddings list.
http_response.raise_for_status()

response = http_response.json()
print("Embeddings:", [x.get("embedding") for x in response.get("data", [])])