-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathtest_guithinker_custom.py
128 lines (98 loc) · 4.56 KB
/
test_guithinker_custom.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
import os
import copy
import time
import json
import glob
import shutil
import argparse
import subprocess
from agent.autopc import AutoPC
from agent.utils.gui_capture import get_screenshot, focus_software
from agent.gui_parser.sender import send_gui_parser_request
from agent.actor.utils import format_gui, compress_gui
from agent.config import basic_config
def main():
parser = argparse.ArgumentParser(description="GUI-Thinker Locally Running")
parser.add_argument("--software_name", type=str, default="PowerPoint")
parser.add_argument("--userquery", type=str, default="Set the transitions of the second ppt to Push")
parser.add_argument("--projectID", type=str, default="000", help="The ID of current task")
parser.add_argument("--projfile_path", type=str, default="data/project_files/300. PowerPoint Applying Transitions/project.pptx", help="the file ready to operate")
parser.add_argument("--maximum_step", type=int, default=20, help="total steps")
parser.add_argument("--max_critic_trials", type=int, default=3, help="set the maiximum trials of critic times")
args = parser.parse_args()
saved_folder = 'test_results/%s'%(basic_config['planner_critic']['lmm'])
software_name = args.software_name
video_path = "" # leave it blank
projectID = args.projectID
query = args.userquery
projfile_path = args.projfile_path
subprocess.Popen([projfile_path], shell=True)
time.sleep(2)
maximum_step = args.maximum_step
max_critic_trials = args.max_critic_trials
## initialize the parameters
state = '<Continue>'
code = ""
last_screenshot_path = ""
critic_count = 0
autopc = AutoPC(software_name=software_name, project_id=projectID)
focus_software(software_name)
meta_data, screenshot_path = get_screenshot(software_name)
new_screenpath = os.path.join("%s"%(saved_folder), software_name, "%s_start.png"%(projectID))
print('Save result in', new_screenpath)
os.makedirs(os.path.dirname(new_screenpath), exist_ok=True)
shutil.copy(screenshot_path, new_screenpath)
gui_results = send_gui_parser_request(basic_config['gui_parser']['url'], software_name, screenshot_path, meta_data, task_id=projectID, step_id="1")
gui_info = compress_gui(copy.deepcopy(gui_results))
gui_info = "\n".join(format_gui(gui_info))
print('User Query:', query)
focus_software(software_name)
plan = autopc.run_planner(query, software_name, screenshot_path, gui_info, video_path)
print('Plan:\n', plan)
for idx in range(maximum_step):
meta_data, screenshot_path = get_screenshot(software_name)
print("===Current task===", "Index:", idx, state)
print(autopc.current_task.name.strip())
code, state, current_task = autopc.run_step(state,
code,
autopc.current_task,
meta_data,
last_screenshot_path,
screenshot_path,
software_name,
if_screenshot=True)
## execute the action code
if code != "":
focus_software(software_name)
exec(code)
last_screenshot_path = screenshot_path
if state == '<Continue>':
state = '<Critic>'
elif state == '<Next>':
autopc.current_task = autopc.current_task.next()
if autopc.current_task:
state = '<Continue>'
code = ""
critic_count = 0
else:
state = '<Finished>'
print("===Current task===", "Index:", idx, state)
break
if state == '<Critic>':
critic_count += 1
if critic_count > max_critic_trials:
autopc.current_task = autopc.current_task.next()
if autopc.current_task:
state = '<Continue>'
code = ""
critic_count = 0
else:
state = '<Finished>'
print('current index', idx, state)
break
new_screenpath = os.path.join("%s"%(saved_folder), software_name, "%s_end.png"%(projectID))
print('Save result in', new_screenpath)
os.makedirs(os.path.dirname(new_screenpath), exist_ok=True)
shutil.copy(screenshot_path, new_screenpath)
if __name__ == "__main__":
main()