# Holo1.5-3B / .eval_results / screenspot_pro.yaml
# marc-thibault-h's picture
# Add ScreenSpot-Pro evaluation result (Holo1.5-3B) (#3)
# f10805d
# ScreenSpot-Pro evaluation results.
#
# Each list entry reports one score:
#   dataset.id       - the benchmark dataset the score was measured on
#   dataset.task_id  - the split of that dataset ("overall" or a per-application
#                      task such as "blender_windows")
#   value            - the reported score for that task
#   source           - where the number was taken from (url, display name, user)
#
# NOTE(review): nesting was reconstructed from a flattened copy; this assumes
# id/task_id belong under `dataset` and url/name/user under `source` - confirm
# against the consumer's schema.
# NOTE(review): values look like percentages on a 0-100 scale - confirm the
# metric against the linked leaderboard.
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: overall
  value: 51.5
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: android_studio_macos
  value: 50.0
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: autocad_windows
  value: 14.7
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: blender_windows
  value: 47.9
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: davinci_macos
  value: 54.5
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: eviews_windows
  value: 94.0
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: excel_macos
  value: 40.6
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: fruitloops_windows
  value: 42.1
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: illustrator_windows
  value: 19.4
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: inventor_windows
  value: 48.6
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: linux_common_linux
  value: 48.0
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: macos_common_macos
  value: 41.5
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: matlab_macos
  value: 66.7
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: origin_windows
  value: 27.4
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: photoshop_windows
  value: 51.0
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: powerpoint_windows
  value: 70.7
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: premiere_windows
  value: 42.3
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: pycharm_macos
  value: 55.1
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: quartus_windows
  value: 35.6
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: solidworks_windows
  value: 32.5
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: stata_windows
  value: 46.9
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: unreal_engine_windows
  value: 60.0
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: vivado_windows
  value: 71.2
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: vmware_macos
  value: 58.5
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: vscode_macos
  value: 56.4
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: windows_common_windows
  value: 32.1
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve
- dataset:
    id: likaixin/ScreenSpot-Pro
    task_id: word_macos
  value: 85.7
  source:
    url: https://gui-agent.github.io/grounding-leaderboard/
    name: ScreenSpot-Pro Leaderboard
    user: merve