Add average per-sentence encoding latency (avg_latency) to the output

This commit is contained in:
2025-09-03 12:06:44 +08:00
parent 0010e9586b
commit 4363025bde

View File

@@ -74,6 +74,7 @@ def main():
# 两两相似度(余弦)——已归一化则点积即余弦
similarity = embeddings @ embeddings.T
avg_latency = encode_time / len(sentences) if sentences else 0
# 组织输出
result = {
@@ -81,7 +82,8 @@ def main():
"device": device,
"count": len(sentences),
"dim": int(embeddings.shape[1]) if len(embeddings.shape) == 2 else None,
"encode_time_seconds": round(float(encode_time), 6),
"total_elapsed_seconds": round(float(encode_time), 6),
"avg_latency": avg_latency,
"sentences": sentences,
"embeddings": embeddings.tolist(), # [N, D]
"similarity": similarity.tolist() # [N, N]