forked from likaixin2000/ScreenSpot-Pro-GUI-Grounding
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrun_ss_pro.sh
More file actions
executable file
·83 lines (76 loc) · 2.85 KB
/
run_ss_pro.sh
File metadata and controls
executable file
·83 lines (76 loc) · 2.85 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
#!/bin/bash
set -e
# English: evaluate each baseline model with eval_screenspot_pro_parallel.py
# (--task all, --language en, --gt_type positive), one result file per model.
models=(
  "kimivl" "cogagent24" "ariaui" "uground" "osatlas-7b" "osatlas-4b"
  "showui" "seeclick" "qwen1vl" "qwen2vl" "minicpmv" "cogagent" "gpt4o"
)
# Make sure the log directory exists up front, in case the evaluator does not
# create it itself (not visible from this script).
mkdir -p -- "./results"
for model in "${models[@]}"; do
  python eval_screenspot_pro_parallel.py \
    --model_type "${model}" \
    --screenspot_imgs "../data/ScreenSpot-Pro/images" \
    --screenspot_test "../data/ScreenSpot-Pro/annotations" \
    --task "all" \
    --language "en" \
    --gt_type "positive" \
    --log_path "./results/${model}.json" \
    --inst_style "instruction" \
    --num_gpu 7
done
# Qwen2.5-VL series: evaluate each checkpoint with eval_screenspot_pro.py
# using --model_type qwen2_5vl.
ckpts=(
  "Qwen/Qwen2.5-VL-3B-Instruct"
  "Qwen/Qwen2.5-VL-7B-Instruct"
  "Qwen/Qwen2.5-VL-72B-Instruct"
)
for ckpt in "${ckpts[@]}"; do
  log_path="./results/${ckpt}.json"
  # The checkpoint id contains a slash ("Qwen/..."), so the log file lives in
  # a subdirectory of ./results. Create it up front, in case the evaluator does
  # not create parent directories itself (not visible from this script).
  mkdir -p -- "${log_path%/*}"
  python eval_screenspot_pro.py \
    --model_type "qwen2_5vl" \
    --model_name_or_path "${ckpt}" \
    --screenspot_imgs "../data/ScreenSpot-Pro/images" \
    --screenspot_test "../data/ScreenSpot-Pro/annotations" \
    --task "all" \
    --language "en" \
    --gt_type "positive" \
    --log_path "${log_path}" \
    --inst_style "instruction"
done
# Qwen3-VL series: evaluate the Instruct and Thinking checkpoints with
# eval_screenspot_pro_parallel.py using --model_type qwen3vl.
ckpts=(
  "Qwen/Qwen3-VL-2B-Instruct"
  "Qwen/Qwen3-VL-4B-Instruct"
  "Qwen/Qwen3-VL-8B-Instruct"
  "Qwen/Qwen3-VL-32B-Instruct"
  "Qwen/Qwen3-VL-30B-A3B-Instruct"
  "Qwen/Qwen3-VL-2B-Thinking"
  "Qwen/Qwen3-VL-4B-Thinking"
  "Qwen/Qwen3-VL-8B-Thinking"
  "Qwen/Qwen3-VL-32B-Thinking"
  "Qwen/Qwen3-VL-30B-A3B-Thinking"
)
for ckpt in "${ckpts[@]}"; do
  log_path="./results/${ckpt}.json"
  # The checkpoint id contains a slash ("Qwen/..."), so the log file lives in
  # a subdirectory of ./results. Create it up front, in case the evaluator does
  # not create parent directories itself (not visible from this script).
  mkdir -p -- "${log_path%/*}"
  python eval_screenspot_pro_parallel.py \
    --model_type "qwen3vl" \
    --model_name_or_path "${ckpt}" \
    --screenspot_imgs "../data/ScreenSpot-Pro/images" \
    --screenspot_test "../data/ScreenSpot-Pro/annotations" \
    --task "all" \
    --language "en" \
    --gt_type "positive" \
    --log_path "${log_path}" \
    --inst_style "instruction"
done
# Qwen3-VL 235B-A22B checkpoints: same invocation as the other Qwen3-VL
# models, kept as a separate list and loop.
ckpts=(
  "Qwen/Qwen3-VL-235B-A22B-Instruct"
  "Qwen/Qwen3-VL-235B-A22B-Thinking"
)
for ckpt in "${ckpts[@]}"; do
  log_path="./results/${ckpt}.json"
  # The checkpoint id contains a slash ("Qwen/..."), so the log file lives in
  # a subdirectory of ./results. Create it up front, in case the evaluator does
  # not create parent directories itself (not visible from this script).
  mkdir -p -- "${log_path%/*}"
  python eval_screenspot_pro_parallel.py \
    --model_type "qwen3vl" \
    --model_name_or_path "${ckpt}" \
    --screenspot_imgs "../data/ScreenSpot-Pro/images" \
    --screenspot_test "../data/ScreenSpot-Pro/annotations" \
    --task "all" \
    --language "en" \
    --gt_type "positive" \
    --log_path "${log_path}" \
    --inst_style "instruction"
done
# GPT-5: evaluate the listed model snapshot(s) with
# eval_screenspot_pro_parallel.py using --model_type gpt5.
ckpts=("gpt-5-2025-08-07")
for ckpt in "${ckpts[@]}"; do
  log_path="./results/${ckpt}.json"
  # Create the log's parent directory up front, in case the evaluator does not
  # create it itself (not visible from this script). Also covers any future
  # id that contains a slash.
  mkdir -p -- "${log_path%/*}"
  python eval_screenspot_pro_parallel.py \
    --model_type "gpt5" \
    --model_name_or_path "${ckpt}" \
    --screenspot_imgs "../data/ScreenSpot-Pro/images" \
    --screenspot_test "../data/ScreenSpot-Pro/annotations" \
    --task "all" \
    --language "en" \
    --gt_type "positive" \
    --log_path "${log_path}" \
    --inst_style "instruction"
done