初始化项目,由ModelHub XC社区提供模型
Model: Hcompany/Holo1.5-3B Source: Original Platform
This commit is contained in:
242
.eval_results/screenspot_pro.yaml
Normal file
242
.eval_results/screenspot_pro.yaml
Normal file
@@ -0,0 +1,242 @@
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: overall
|
||||
value: 51.5
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: android_studio_macos
|
||||
value: 50.0
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: autocad_windows
|
||||
value: 14.7
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: blender_windows
|
||||
value: 47.9
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: davinci_macos
|
||||
value: 54.5
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: eviews_windows
|
||||
value: 94.0
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: excel_macos
|
||||
value: 40.6
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: fruitloops_windows
|
||||
value: 42.1
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: illustrator_windows
|
||||
value: 19.4
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: inventor_windows
|
||||
value: 48.6
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: linux_common_linux
|
||||
value: 48.0
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: macos_common_macos
|
||||
value: 41.5
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: matlab_macos
|
||||
value: 66.7
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: origin_windows
|
||||
value: 27.4
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: photoshop_windows
|
||||
value: 51.0
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: powerpoint_windows
|
||||
value: 70.7
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: premiere_windows
|
||||
value: 42.3
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: pycharm_macos
|
||||
value: 55.1
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: quartus_windows
|
||||
value: 35.6
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: solidworks_windows
|
||||
value: 32.5
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: stata_windows
|
||||
value: 46.9
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: unreal_engine_windows
|
||||
value: 60.0
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: vivado_windows
|
||||
value: 71.2
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: vmware_macos
|
||||
value: 58.5
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: vscode_macos
|
||||
value: 56.4
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: windows_common_windows
|
||||
value: 32.1
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
|
||||
- dataset:
|
||||
id: likaixin/ScreenSpot-Pro
|
||||
task_id: word_macos
|
||||
value: 85.7
|
||||
source:
|
||||
url: https://gui-agent.github.io/grounding-leaderboard/
|
||||
name: ScreenSpot-Pro Leaderboard
|
||||
user: merve
|
||||
Reference in New Issue
Block a user