[Feature] Support reward model LxzGordon/URM-LLaMa-3.1-8B (#1525)
This commit is contained in:
@@ -73,7 +73,9 @@ class TestGenerationModels(unittest.TestCase):
|
||||
max_new_tokens = 32
|
||||
|
||||
with HFRunner(
|
||||
model_path, torch_dtype=torch_dtype, is_generation=True
|
||||
model_path,
|
||||
torch_dtype=torch_dtype,
|
||||
model_type="generation",
|
||||
) as hf_runner:
|
||||
hf_outputs = hf_runner.forward(prompts, max_new_tokens=max_new_tokens)
|
||||
|
||||
@@ -81,7 +83,7 @@ class TestGenerationModels(unittest.TestCase):
|
||||
model_path,
|
||||
tp_size=model_case.tp_size,
|
||||
torch_dtype=torch_dtype,
|
||||
is_generation=True,
|
||||
model_type="generation",
|
||||
) as srt_runner:
|
||||
srt_outputs = srt_runner.forward(prompts, max_new_tokens=max_new_tokens)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user