minor: support specifying local dataset path for gsm8k and hellaswag (#2816)

This commit is contained in:
sleepcoo
2025-01-09 22:24:42 +08:00
committed by GitHub
parent 679c3bcacf
commit 4f077c01b8
2 changed files with 10 additions and 4 deletions

View File

@@ -1,6 +1,7 @@
 import argparse
 import ast
 import json
+import os
 import re
 import time
@@ -46,9 +47,11 @@ def main(args):
     set_default_backend(select_sglang_backend(args))
     # Read data
+    data_path = args.data_path
     url = "https://raw.githubusercontent.com/openai/grade-school-math/master/grade_school_math/data/test.jsonl"
-    filename = download_and_cache_file(url)
-    lines = list(read_jsonl(filename))
+    if not os.path.isfile(data_path):
+        data_path = download_and_cache_file(url)
+    lines = list(read_jsonl(data_path))
     # Construct prompts
     num_questions = args.num_questions

View File

@@ -1,5 +1,6 @@
 import argparse
 import json
+import os
 import time
 import numpy as np
@@ -31,9 +32,11 @@ def main(args):
     set_default_backend(select_sglang_backend(args))
     # Read data
+    data_path = args.data_path
     url = "https://raw.githubusercontent.com/rowanz/hellaswag/master/data/hellaswag_val.jsonl"
-    filename = download_and_cache_file(url)
-    lines = list(read_jsonl(filename))
+    if not os.path.isfile(data_path):
+        data_path = download_and_cache_file(url)
+    lines = list(read_jsonl(data_path))
     # Construct prompts
     num_questions = args.num_questions