Files
xc-llm-kunlun/ci/scripts/tests/run_accuracy.sh

24 lines
523 B
Bash
Raw Permalink Normal View History

#!/usr/bin/env bash
#
# Runs a short evalscope accuracy check inside an already-running container
# and fails if the evaluation itself fails.
#
# The two `source` paths are relative, so the script has to be started from
# the directory that contains `ci/`.
#
# Variables read here but not defined in this file (presumably provided by
# ci/scripts/common/env.sh or the CI environment -- confirm there):
#   DOCKER_NAME        container handed to `docker exec`
#   ACC_LOG            log path, resolved inside the container (rm/tee run there)
#   PROXY_URL          exported as http_proxy and https_proxy in the container
#   NO_PROXY_LIST      exported as NO_PROXY and no_proxy in the container
#   SERVED_MODEL_NAME  passed to `evalscope eval --model`
#   VLLM_PORT          port used in --api-url http://localhost:<port>/v1
set -euo pipefail

source ci/scripts/common/env.sh
source ci/scripts/common/log.sh

# `log` is not defined in this file; presumably it comes from log.sh above.
log "Running accuracy test via evalscope"

# The script text below is double-quoted, so every ${...} is expanded by THIS
# (host) shell before the text is sent to the container, and each
# backslash-newline is removed, joining the evalscope command into one line.
#
# The inner shell is a separate bash process and does not inherit the `set`
# options above. Without `pipefail` there, the status of `evalscope | tee`
# would be tee's status, so a failed evaluation would still exit 0 and the CI
# step would pass. `set -eo pipefail` makes the evalscope failure propagate
# through `docker exec` back to this script.
docker exec "${DOCKER_NAME}" bash -lc "
set -eo pipefail
rm -f ${ACC_LOG}
export http_proxy=${PROXY_URL}
export https_proxy=${PROXY_URL}
export NO_PROXY=${NO_PROXY_LIST}
export no_proxy=${NO_PROXY_LIST}
evalscope eval \
--model ${SERVED_MODEL_NAME} \
--api-url http://localhost:${VLLM_PORT}/v1 \
--datasets gsm8k arc \
--limit 10 2>&1 | tee ${ACC_LOG}
"