[Feature] Support reward model LxzGordon/URM-LLaMa-3.1-8B (#1525)

This commit is contained in:
Ying Sheng
2024-09-27 23:32:11 -07:00
committed by GitHub
parent b1e330bcb0
commit 9aa6553d2a
13 changed files with 478 additions and 44 deletions

View File

@@ -73,7 +73,9 @@ class TestGenerationModels(unittest.TestCase):
max_new_tokens = 32
with HFRunner(
-model_path, torch_dtype=torch_dtype, is_generation=True
+model_path,
+torch_dtype=torch_dtype,
+model_type="generation",
) as hf_runner:
hf_outputs = hf_runner.forward(prompts, max_new_tokens=max_new_tokens)
@@ -81,7 +83,7 @@ class TestGenerationModels(unittest.TestCase):
model_path,
tp_size=model_case.tp_size,
torch_dtype=torch_dtype,
-is_generation=True,
+model_type="generation",
) as srt_runner:
srt_outputs = srt_runner.forward(prompts, max_new_tokens=max_new_tokens)