Fuse more ops & Simplify token mapping (#1758)

This commit is contained in:
Lianmin Zheng
2024-10-22 23:20:43 -07:00
committed by GitHub
parent 17536e7e3d
commit ad4125d1a9
9 changed files with 99 additions and 75 deletions

View File

@@ -67,6 +67,7 @@ def run_eval(args):
model=args.model,
max_tokens=2048,
base_url=base_url,
temperature=getattr(args, "temperature", 0.0),
)
# Run eval
@@ -119,6 +120,7 @@ if __name__ == "__main__":
parser.add_argument("--eval-name", type=str, default="mmlu")
parser.add_argument("--num-examples", type=int)
parser.add_argument("--num-threads", type=int, default=512)
parser.add_argument("--temperature", type=float, default=0.0)
args = parser.parse_args()
run_eval(args)