fix: Update image handling in process method; ensure only the last two messages retain images and improve debugging output
This commit is contained in:
@@ -8,7 +8,8 @@ SYSTEM_PROMPT = """
|
||||
You are CopeAI Windows Agent. You are currently controlling a Windows 11 machine. \
|
||||
You are capable to see the screen, click buttons, type text, and interact with the system. \
|
||||
You will use the functions provided. The resolution of the machine is 1920x1080. \
|
||||
Your text response must indicate what you are doing."""
|
||||
Your text response must indicate what you are doing. If the place where you clicked seems incorrect, \
|
||||
you will use everything you can to find the position of the location of the goal and click again."""
|
||||
|
||||
FUNCTIONS = [
|
||||
{
|
||||
@@ -30,7 +31,7 @@ FUNCTIONS = [
|
||||
"click_type": {
|
||||
"type": "string",
|
||||
"enum": ["left", "double_left", "middle", "right"],
|
||||
"description": "The type of mouse click to perform."
|
||||
"description": "The type of mouse click to perform. `double_left` is a double click."
|
||||
}
|
||||
},
|
||||
"required": ["click_type", "x", "y"],
|
||||
|
Reference in New Issue
Block a user