初始化项目,由ModelHub XC社区提供模型
Model: seopbo/rlvrcodemathif-qwen2.5-1.5b Source: Original Platform
This commit is contained in:
16
eval-results/ifbench/metrics.json
Normal file
16
eval-results/ifbench/metrics.json
Normal file
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"ifbench": {
|
||||
"pass@1": {
|
||||
"num_prompts": 294,
|
||||
"num_instructions": 335,
|
||||
"average_score": 20.429739059803026,
|
||||
"prompt_strict_accuracy": 17.687074829931973,
|
||||
"instruction_strict_accuracy": 19.701492537313435,
|
||||
"prompt_loose_accuracy": 20.74829931972789,
|
||||
"instruction_loose_accuracy": 23.582089552238806,
|
||||
"num_entries": 294,
|
||||
"avg_tokens": 423,
|
||||
"gen_seconds": 51
|
||||
}
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user