Compare commits

...

4 Commits

3 changed files with 7 additions and 6 deletions

View File

@@ -45,10 +45,11 @@ def perform_ocr(screenshot: bytes) -> list[dict]:
for i in range(n): for i in range(n):
text = data['text'][i] text = data['text'][i]
if text and text.strip(): if text and text.strip():
# Fix the center-point calculation: center = origin + half the extent (left + width // 2, top + height // 2)
results.append({ results.append({
'text': text, 'text': text,
'x': data['width'][i] + data['left'][i] // 2, # center x position 'x': data['left'][i] + data['width'][i] // 2,
'y': data['height'][i] + data['top'][i] // 2 # center y position 'y': data['top'][i] + data['height'][i] // 2
}) })
# check if debug is enabled # check if debug is enabled
@@ -109,7 +110,7 @@ def wait(duration: float) -> None:
def search_pc(query: str) -> None: def search_pc(query: str) -> None:
"""Presses the Windows key.""" """Presses the Windows key."""
pyautogui.hotkey('win') pyautogui.hotkey('win')
wait(2) wait(4)
press_keyboard(KeyboardInput(text=query)) press_keyboard(KeyboardInput(text=query))
def reprompt(nextsteps: str, processor) -> None: def reprompt(nextsteps: str, processor) -> None:

View File

@@ -117,7 +117,7 @@ class AIProcessor:
self.session.messages.append( self.session.messages.append(
aic.Message( aic.Message(
role="assistant", role="assistant",
content=str(tool_calls), content=str(((tc.function.name, tc.function.arguments) for tc in tool_calls)),
) )
) )
@@ -135,7 +135,7 @@ class AIProcessor:
output_text: str = response.choices[0].message.content # type: ignore output_text: str = response.choices[0].message.content # type: ignore
outputs.append(output_text) outputs.append(output_text)
self.session.messages.append( self.session.messages.append(
aic.Message(role="assistant", content=output_text) aic.Message(role="assistant", content="Executed: " + (str(*outputs)))
) )
return [*outputs] return [*outputs]

View File

@@ -31,7 +31,7 @@ FUNCTIONS = [
"click_type": { "click_type": {
"type": "string", "type": "string",
"enum": ["left", "double_left", "middle", "right"], "enum": ["left", "double_left", "middle", "right"],
"description": "The type of mouse click to perform. `double_left` is a double click." "description": "The type of mouse click to perform. `double_left` is a double click, used to open apps or files."
} }
}, },
"required": ["click_type", "x", "y"], "required": ["click_type", "x", "y"],