初始化项目,由ModelHub XC社区提供模型
Model: seopbo/rlvrmulti-qwen2.5-1.5b Source: Original Platform
This commit is contained in:
16
eval-results/ifeval/metrics.json
Normal file
16
eval-results/ifeval/metrics.json
Normal file
@@ -0,0 +1,16 @@
|
||||
{
|
||||
"ifeval": {
|
||||
"pass@1": {
|
||||
"num_prompts": 541,
|
||||
"num_instructions": 834,
|
||||
"average_score": 69.8299955229901,
|
||||
"prompt_strict_accuracy": 63.95563770794824,
|
||||
"instruction_strict_accuracy": 72.78177458033574,
|
||||
"prompt_loose_accuracy": 67.28280961182995,
|
||||
"instruction_loose_accuracy": 75.29976019184652,
|
||||
"num_entries": 541,
|
||||
"avg_tokens": 492,
|
||||
"gen_seconds": 26
|
||||
}
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user