189 lines
6.0 KiB
Python
189 lines
6.0 KiB
Python
from typing import Literal, Optional
|
|
|
|
from pydantic import BaseModel, Field, model_validator
|
|
|
|
|
|
class PixelTarget(BaseModel):
|
|
mode: Literal["pixel"]
|
|
x: int
|
|
y: int
|
|
dx: int = 0
|
|
dy: int = 0
|
|
|
|
|
|
class GridTarget(BaseModel):
|
|
mode: Literal["grid"]
|
|
region_x: int
|
|
region_y: int
|
|
region_width: int = Field(gt=0)
|
|
region_height: int = Field(gt=0)
|
|
rows: int = Field(gt=0)
|
|
cols: int = Field(gt=0)
|
|
row: int = Field(ge=0)
|
|
col: int = Field(ge=0)
|
|
dx: float = 0.0
|
|
dy: float = 0.0
|
|
|
|
@model_validator(mode="after")
|
|
def _validate_indices(self):
|
|
if self.row >= self.rows or self.col >= self.cols:
|
|
raise ValueError("row/col must be inside rows/cols")
|
|
if not -1.0 <= self.dx <= 1.0:
|
|
raise ValueError("dx must be in [-1, 1]")
|
|
if not -1.0 <= self.dy <= 1.0:
|
|
raise ValueError("dy must be in [-1, 1]")
|
|
return self
|
|
|
|
|
|
Target = PixelTarget | GridTarget
|
|
|
|
|
|
class ActionRequest(BaseModel):
|
|
action: Literal[
|
|
"move",
|
|
"click",
|
|
"right_click",
|
|
"double_click",
|
|
"middle_click",
|
|
"scroll",
|
|
"type",
|
|
"hotkey",
|
|
"click_text",
|
|
]
|
|
target: Optional[Target] = None
|
|
duration_ms: int = Field(default=0, ge=0, le=20000)
|
|
button: Literal["left", "right", "middle"] = "left"
|
|
clicks: int = Field(default=1, ge=1, le=10)
|
|
scroll_amount: int = 0
|
|
text: str = ""
|
|
keys: list[str] = Field(default_factory=list)
|
|
interval_ms: int = Field(default=20, ge=0, le=5000)
|
|
dry_run: bool = False
|
|
click_text: "ClickTextAction | None" = None
|
|
|
|
@model_validator(mode="after")
|
|
def _validate_click_text(self):
|
|
if self.action == "click_text" and self.click_text is None:
|
|
raise ValueError("click_text payload is required when action=click_text")
|
|
return self
|
|
|
|
|
|
class ExecRequest(BaseModel):
|
|
command: str = Field(min_length=1, max_length=10000)
|
|
shell: Literal["powershell", "bash", "cmd"] | None = None
|
|
timeout_s: int | None = Field(default=None, ge=1, le=600)
|
|
cwd: str | None = None
|
|
dry_run: bool = False
|
|
|
|
|
|
class WindowQuery(BaseModel):
|
|
title_contains: str | None = Field(default=None, max_length=512)
|
|
title_regex: str | None = Field(default=None, max_length=512)
|
|
process_name: str | None = Field(default=None, max_length=260)
|
|
hwnd: int | None = Field(default=None, ge=1)
|
|
visible_only: bool = True
|
|
|
|
|
|
class WindowActionRequest(WindowQuery):
|
|
action: Literal["focus", "restore", "minimize", "maximize", "close"]
|
|
timeout_ms: int = Field(default=3000, ge=0, le=60000)
|
|
|
|
|
|
class LaunchRequest(BaseModel):
|
|
executable: str = Field(min_length=1, max_length=2048)
|
|
args: list[str] = Field(default_factory=list, max_length=100)
|
|
cwd: str | None = None
|
|
wait_for_window: bool = False
|
|
match: WindowQuery | None = None
|
|
timeout_ms: int = Field(default=5000, ge=0, le=120000)
|
|
dry_run: bool = False
|
|
|
|
|
|
class SeeRequest(BaseModel):
|
|
screen: int = 0
|
|
region_x: int | None = Field(default=None, ge=0)
|
|
region_y: int | None = Field(default=None, ge=0)
|
|
region_width: int | None = Field(default=None, gt=0)
|
|
region_height: int | None = Field(default=None, gt=0)
|
|
with_grid: bool = True
|
|
grid_rows: int = Field(default=12, ge=1, le=300)
|
|
grid_cols: int = Field(default=12, ge=1, le=300)
|
|
include_labels: bool = True
|
|
image_format: Literal["png", "jpeg"] = "png"
|
|
jpeg_quality: int = Field(default=85, ge=1, le=100)
|
|
ocr: bool = False
|
|
ocr_min_confidence: float = Field(default=0.0, ge=0.0, le=100.0)
|
|
ocr_lang: str = Field(default="eng", min_length=1, max_length=64)
|
|
ocr_psm: int | None = Field(default=None, ge=0, le=13)
|
|
|
|
|
|
class SeeZoomRequest(BaseModel):
|
|
screen: int = 0
|
|
center_x: int = Field(ge=0)
|
|
center_y: int = Field(ge=0)
|
|
width: int = Field(default=500, ge=10)
|
|
height: int = Field(default=350, ge=10)
|
|
with_grid: bool = True
|
|
grid_rows: int = Field(default=20, ge=1, le=300)
|
|
grid_cols: int = Field(default=20, ge=1, le=300)
|
|
include_labels: bool = True
|
|
image_format: Literal["png", "jpeg"] = "png"
|
|
jpeg_quality: int = Field(default=90, ge=1, le=100)
|
|
|
|
|
|
class InteractRequest(BaseModel):
|
|
screen: int = 0
|
|
action: ActionRequest
|
|
|
|
|
|
class OCRRegion(BaseModel):
|
|
x: int = Field(ge=0)
|
|
y: int = Field(ge=0)
|
|
width: int = Field(gt=0)
|
|
height: int = Field(gt=0)
|
|
|
|
|
|
class ClickTextAction(BaseModel):
|
|
text: str = Field(min_length=1, max_length=1000)
|
|
match: Literal["contains", "exact", "regex"] = "contains"
|
|
region: OCRRegion | None = None
|
|
screen: int | None = None
|
|
case_sensitive: bool = False
|
|
min_confidence: float = Field(default=0.0, ge=0.0, le=100.0)
|
|
occurrence: Literal["first", "best", "nth"] = "first"
|
|
nth: int | None = Field(default=None, ge=1, le=10000)
|
|
ocr_lang: str = Field(default="eng", min_length=1, max_length=64)
|
|
ocr_psm: int | None = Field(default=None, ge=0, le=13)
|
|
|
|
@model_validator(mode="after")
|
|
def _validate_nth(self):
|
|
if self.occurrence == "nth" and self.nth is None:
|
|
raise ValueError("nth is required when occurrence=nth")
|
|
if self.occurrence != "nth" and self.nth is not None:
|
|
raise ValueError("nth is only allowed when occurrence=nth")
|
|
return self
|
|
|
|
|
|
class VerifyOCRTextNearPoint(BaseModel):
|
|
type: Literal["ocr_text_near_point"]
|
|
text: str = Field(min_length=1, max_length=1000)
|
|
x: int = Field(ge=0)
|
|
y: int = Field(ge=0)
|
|
radius: int = Field(default=80, ge=1, le=1000)
|
|
screen: int = 0
|
|
match: Literal["contains", "exact", "regex"] = "contains"
|
|
case_sensitive: bool = False
|
|
min_confidence: float = Field(default=0.0, ge=0.0, le=100.0)
|
|
ocr_lang: str = Field(default="eng", min_length=1, max_length=64)
|
|
ocr_psm: int | None = Field(default=None, ge=0, le=13)
|
|
|
|
|
|
class InteractVerifyRequest(BaseModel):
|
|
action: InteractRequest
|
|
verify: VerifyOCRTextNearPoint
|
|
check_interval_ms: int = Field(default=250, ge=50, le=5000)
|
|
timeout_ms: int = Field(default=3000, ge=100, le=60000)
|
|
|
|
|
|
ActionRequest.model_rebuild()
|