Compare commits
4 Commits
e5b3ea8b57
...
main
Author | SHA1 | Date | |
---|---|---|---|
6b13586154 | |||
7192f4bc18 | |||
36cfeffe9c | |||
7f5296b2ef |
@@ -45,10 +45,11 @@ def perform_ocr(screenshot: bytes) -> list[dict]:
|
|||||||
for i in range(n):
|
for i in range(n):
|
||||||
text = data['text'][i]
|
text = data['text'][i]
|
||||||
if text and text.strip():
|
if text and text.strip():
|
||||||
|
# Fix the center-point calculation: origin plus half the extent (left + width // 2, top + height // 2)
|
||||||
results.append({
|
results.append({
|
||||||
'text': text,
|
'text': text,
|
||||||
'x': data['width'][i] + data['left'][i] // 2, # center x position
|
'x': data['left'][i] + data['width'][i] // 2,
|
||||||
'y': data['height'][i] + data['top'][i] // 2 # center y position
|
'y': data['top'][i] + data['height'][i] // 2
|
||||||
})
|
})
|
||||||
|
|
||||||
# check if debug is enabled
|
# check if debug is enabled
|
||||||
@@ -109,7 +110,7 @@ def wait(duration: float) -> None:
|
|||||||
def search_pc(query: str) -> None:
|
def search_pc(query: str) -> None:
|
||||||
"""Presses the Windows key, waits, then sends `query` as keyboard input."""
|
"""Presses the Windows key, waits, then sends `query` as keyboard input."""
|
||||||
pyautogui.hotkey('win')
|
pyautogui.hotkey('win')
|
||||||
wait(2)
|
wait(4)
|
||||||
press_keyboard(KeyboardInput(text=query))
|
press_keyboard(KeyboardInput(text=query))
|
||||||
|
|
||||||
def reprompt(nextsteps: str, processor) -> None:
|
def reprompt(nextsteps: str, processor) -> None:
|
||||||
|
@@ -117,7 +117,7 @@ class AIProcessor:
|
|||||||
self.session.messages.append(
|
self.session.messages.append(
|
||||||
aic.Message(
|
aic.Message(
|
||||||
role="assistant",
|
role="assistant",
|
||||||
content=str(tool_calls),
|
content=str(((tc.function.name, tc.function.arguments) for tc in tool_calls)),
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -135,7 +135,7 @@ class AIProcessor:
|
|||||||
output_text: str = response.choices[0].message.content # type: ignore
|
output_text: str = response.choices[0].message.content # type: ignore
|
||||||
outputs.append(output_text)
|
outputs.append(output_text)
|
||||||
self.session.messages.append(
|
self.session.messages.append(
|
||||||
aic.Message(role="assistant", content=output_text)
|
aic.Message(role="assistant", content="Executed: " + (str(*outputs)))
|
||||||
)
|
)
|
||||||
|
|
||||||
return [*outputs]
|
return [*outputs]
|
||||||
|
@@ -31,7 +31,7 @@ FUNCTIONS = [
|
|||||||
"click_type": {
|
"click_type": {
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"enum": ["left", "double_left", "middle", "right"],
|
"enum": ["left", "double_left", "middle", "right"],
|
||||||
"description": "The type of mouse click to perform. `double_left` is a double click."
|
"description": "The type of mouse click to perform. `double_left` is a double click, used to open apps or files."
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"required": ["click_type", "x", "y"],
|
"required": ["click_type", "x", "y"],
|
||||||
|
Reference in New Issue
Block a user