199 lines
4.7 KiB
YAML
199 lines
4.7 KiB
YAML
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: overall
|
|
value: 80.5
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: digital
|
|
value: 90.5
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: photographed
|
|
value: 77.2
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: latin
|
|
value: 81.7
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: de
|
|
value: 82.6
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: en
|
|
value: 87.4
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: es
|
|
value: 71.3
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: fr
|
|
value: 70.1
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: id
|
|
value: 84.5
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: it
|
|
value: 89.3
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: nl
|
|
value: 83.2
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: pt
|
|
value: 86.8
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: vi
|
|
value: 79.9
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: non_latin
|
|
value: 79.2
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: ar
|
|
value: 83.3
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: hi
|
|
value: 83.6
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: jp
|
|
value: 75.0
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: ko
|
|
value: 78.7
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: ru
|
|
value: 71.2
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: th
|
|
value: 77.9
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: zh
|
|
value: 84.6
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|
|
- dataset:
|
|
id: Delores-Lin/MDPBench
|
|
task_id: zh_t
|
|
value: 79.6
|
|
date: "2026-04-14"
|
|
source:
|
|
url: https://huggingface.co/datasets/Delores-Lin/MDPBench
|
|
name: MDPBench leaderboard
|
|
user: Delores-Lin
|