codespearhead · codespearhead · Apr 22, 2026 · Apr 22, 2026
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
@@ -48,7 +48,7 @@ jobs:
               - 'Dockerfile'
               - '.github/workflows/ci.yml'
 
-  lint:
+  format_and_lint:
     timeout-minutes: 3
     runs-on: ubuntu-latest
 
@@ -95,7 +95,7 @@ jobs:
       - name: Install dependencies
         run: |
           source .venv/bin/activate
-          poetry install --no-root --with format
+          poetry install --no-root --with format,lint
 
       - name: Check for successful installation
         run: |
@@ -106,3 +106,8 @@ jobs:
         run: |
           source .venv/bin/activate
           poetry run python tasks/format.py --dry-run
+
+      - name: Lint project
+        run: |
+          source .venv/bin/activate
+          poetry run mypy
diff --git a/README.md b/README.md
@@ -129,3 +129,9 @@ poetry run pytest -rfsxE --capture=no --log-cli-level=DEBUG --maxfail=1 -vv ./te
 ```bash
 poetry run python ./tasks/format.py
 ```
+
+#### Code Linting
+
+```bash
+poetry run mypy
+```
diff --git a/poetry.lock b/poetry.lock
diff --git a/pyproject.toml b/pyproject.toml
@@ -24,13 +24,25 @@ test = [
 format = [
     "ruff (>=0.15.7,<0.16.0)"
 ]
+lint = [
+    "mypy (>=1.20.1,<2.0.0)",
+    "types-pynput (>=1.8.1.20260408,<2.0.0.0)",
+    "types-psutil (>=7.2.2.20260408,<8.0.0.0)"
+]
 
 
 [tool.poetry]
 packages = [
     { include = "visiongui", from = "src" }
 ]
 
+[tool.mypy]
+files = ["src"]
+mypy_path = 'src'
+explicit_package_bases = true
+strict = true
+exclude = '(^|/)(\.venv|build|dist)/'  # match whole directory names only; an unanchored "build"/"dist" would also skip e.g. builder.py
+
 [build-system]
 requires = ["poetry-core>=2.0.0,<3.0.0"]
 build-backend = "poetry.core.masonry.api"
diff --git a/src/visiongui/__init__.py b/src/visiongui/__init__.py
diff --git a/src/visiongui/driver/DesktopDriverInterface.py b/src/visiongui/driver/DesktopDriverInterface.py
@@ -1,3 +1,4 @@
+import re
 import subprocess
 from abc import ABC, abstractmethod
 
@@ -11,11 +12,11 @@
 class DesktopDriverInterface(ABC):
     @property
     @abstractmethod
-    def process(self) -> subprocess.Popen | None: ...
+    def process(self) -> subprocess.Popen[bytes] | None: ...
 
     @process.setter
     @abstractmethod
-    def process(self, value: subprocess.Popen | None) -> None: ...
+    def process(self, value: subprocess.Popen[bytes] | None) -> None: ...
 
     @property
     @abstractmethod
@@ -26,22 +27,22 @@ def window(self) -> pywinctl.Window | None: ...
     def window(self, value: pywinctl.Window | None) -> None: ...
 
     @abstractmethod
-    def launch_process(self, *, cmd: list[str]) -> subprocess.Popen: ...
+    def launch_process(self, *, cmd: list[str]) -> subprocess.Popen[bytes]: ...
 
     @abstractmethod
     def find_window(
         self,
         *,
-        title,
-        timeout: float,
+        title: re.Pattern[str],
+        timeout: int,
     ) -> pywinctl.Window: ...
 
     @abstractmethod
     def wait_for_window_to_disappear(
         self,
         *,
-        title,
-        timeout: float,
+        title: re.Pattern[str],
+        timeout: int,
     ) -> None: ...
 
     @abstractmethod
@@ -59,10 +60,10 @@ def find_element_by_image(
         self,
         *,
         image_path: str,
-        timeout: float,
+        timeout: int,
         log_image_name: str,
         margin_of_error: float,
-        time_held_stable_on_screen: float,
+        time_held_stable_on_screen: int,
         debug_output_base_path: str,
         match_with_color: bool = False,
     ) -> DesktopElementInterface: ...
diff --git a/src/visiongui/driver/DesktopDriverWindowsImplementation.py b/src/visiongui/driver/DesktopDriverWindowsImplementation.py
@@ -1,3 +1,4 @@
+import re
 import subprocess
 
 import pywinctl
@@ -19,16 +20,16 @@
 
 
 class DesktopDriverWindowsImplementation(DesktopDriverInterface):
-    def __init__(self):
-        self._process: subprocess.Popen | None = None
+    def __init__(self) -> None:
+        self._process: subprocess.Popen[bytes] | None = None
         self._window: pywinctl.Window | None = None
 
     @property
-    def process(self) -> subprocess.Popen | None:
+    def process(self) -> subprocess.Popen[bytes] | None:
         return self._process
 
     @process.setter
-    def process(self, value: subprocess.Popen | None) -> None:
+    def process(self, value: subprocess.Popen[bytes] | None) -> None:
         self._process = value
 
     @property
@@ -39,15 +40,15 @@ def window(self) -> pywinctl.Window | None:
     def window(self, value: pywinctl.Window | None) -> None:
         self._window = value
 
-    def launch_process(self, *, cmd: list[str]) -> subprocess.Popen:
+    def launch_process(self, *, cmd: list[str]) -> subprocess.Popen[bytes]:
         self.process = launch_process(cmd=cmd)
         return self.process
 
     def find_window(
         self,
         *,
-        title,
-        timeout: float,
+        title: re.Pattern[str],
+        timeout: int,
     ) -> pywinctl.Window:
         return find_window(
             title=title,
@@ -57,8 +58,8 @@ def find_window(
     def wait_for_window_to_disappear(
         self,
         *,
-        title,
-        timeout: float,
+        title: re.Pattern[str],
+        timeout: int,
     ) -> None:
         return wait_for_window_to_disappear(
             title=title,
@@ -69,10 +70,10 @@ def find_element_by_image(
         self,
         *,
         image_path: str,
-        timeout: float,
+        timeout: int,
         log_image_name: str,
         margin_of_error: float,
-        time_held_stable_on_screen: float,
+        time_held_stable_on_screen: int,
         debug_output_base_path: str,
         match_with_color: bool = False,
     ) -> DesktopElementInterface:

diff --git a/src/visiongui/driver/close.py b/src/visiongui/driver/close.py
@@ -16,7 +16,14 @@ def close(
     if not isinstance(driver, DesktopDriverInterface):
         raise TypeError("Expected driver to be an instance of DesktopDriver")
 
-    pid = driver.window.getPID()
+    window = driver.window
+    if window is None:
+        # psutil.Process(None) resolves to the *current* process, so a missing
+        # window must never fall through to terminate() below.
+        raise RuntimeError("Cannot close driver: no window is attached")
+
+    pid = window.getPID()
+
     logger.debug(f"Forcefully killing process owning the window: {pid}")
     proc = psutil.Process(pid)
     proc.terminate()

diff --git a/src/visiongui/driver/find_element_by_image.py b/src/visiongui/driver/find_element_by_image.py
@@ -1,6 +1,7 @@
 import logging
 import os
 import time
+from collections.abc import Callable
 
 import cv2
 import numpy as np
@@ -23,18 +24,22 @@
 logger = logging.getLogger(__name__)
 
 
-def _is_stable(get_current_location, timeout, time_held_stable_on_screen):
+def _is_stable(
+    get_current_location: Callable[[], DesktopElementImplementation | bool],
+    timeout: int,
+    time_held_stable_on_screen: int,
+) -> DesktopElementImplementation:
     start_time = time.time()
-    last_location = None
+    last_location: DesktopElementImplementation | None = None
     stable_start = None
     found_once = False
 
     while time.time() - start_time < timeout:
         current_location = get_current_location()
-        if current_location:
+        if isinstance(current_location, DesktopElementImplementation):
             found_once = True
             if (
-                last_location
+                last_location is not None
                 and current_location.top_left == last_location.top_left
                 and current_location.bottom_right == last_location.bottom_right
             ):
@@ -60,7 +65,13 @@ def _is_stable(get_current_location, timeout, time_held_stable_on_screen):
     raise ExceptionElementNotFound(timeout=timeout)
 
 
-def _match_template(template, margin_of_error, monitor, screen_image, mask=None):
+def _match_template(
+    template: np.ndarray,
+    margin_of_error: float,
+    monitor: dict[str, int],
+    screen_image: np.ndarray,
+    mask: np.ndarray | None = None,
+) -> DesktopElementImplementation | bool:
     # Ensure screen image has same number of channels as template
     if len(template.shape) == 2:
         if len(screen_image.shape) == 3:
@@ -109,18 +120,21 @@ def _match_template(template, margin_of_error, monitor, screen_image, mask=None)
 
 def find_element_by_image(
     image_path: str,
-    timeout: float,
+    timeout: int,
     log_image_name: str,
     debug_output_base_path: str,
     margin_of_error: float,
-    time_held_stable_on_screen: float,
+    time_held_stable_on_screen: int,
     match_with_color: bool = False,
 ) -> DesktopElementImplementation:
     if not image_path or not os.path.isfile(image_path):
         raise FileNotFoundError(f"Template image not found: {image_path}")
 
     # [68566fb0-e936-48e3-8c87-c5b8735567df] If the image has an alpha channel, extract it to build a binary mask. This mask ensures that only opaque regions of the template are matched, ignoring transparent padding.
     image = cv2.imread(image_path, cv2.IMREAD_UNCHANGED)
+    if image is None:
+        raise ValueError(f"Unable to read image at {image_path}")
+
     mask = None
     template = None
     if len(image.shape) == 3 and image.shape[2] == 4:
@@ -154,7 +168,7 @@ def find_element_by_image(
         with mss() as sct:
             monitor = sct.monitors[1]
 
-            def get_current_location():
+            def get_current_location() -> DesktopElementImplementation | bool:
                 screenshot = sct.grab(monitor)
                 screen_image = np.array(screenshot)
                 return _match_template(
@@ -173,10 +187,12 @@ def get_current_location():
                 )
                 return result
             try:
-                result = WebDriverWait(timeout).until(
+                wait_result = WebDriverWait(timeout).until(
                     condition=get_current_location,
                 )
-                return result
+                if not isinstance(wait_result, DesktopElementImplementation):
+                    raise ExceptionElementNotFound(timeout=timeout)
+                return wait_result
             except ExceptionTimeout:
                 save_debug_screenshot(
                     image_file_name_prefix=FileNamePrefix.FAIL,

diff --git a/src/visiongui/driver/find_window.py b/src/visiongui/driver/find_window.py
@@ -10,8 +10,8 @@
 logger = logging.getLogger(__name__)
 
 
-def _get_matching_window(title: re.Pattern) -> pywinctl.Window | None:
-    all_windows = pywinctl.getAllWindows()
+def _get_matching_window(title: re.Pattern[str]) -> pywinctl.Window | None:
+    all_windows = pywinctl.getAllWindows()  # type: ignore[no-untyped-call]
     titles = [window.title for window in all_windows if window.title.strip()]
     logger.debug(f"Checking all window titles: {titles}")
 
@@ -25,8 +25,8 @@ def _get_matching_window(title: re.Pattern) -> pywinctl.Window | None:
 
 
 def find_window(
-    title: re.Pattern,
-    timeout: float,
+    title: re.Pattern[str],
+    timeout: int,
 ) -> pywinctl.Window:
     def _window_check() -> pywinctl.Window | None:
         return _get_matching_window(title)

diff --git a/src/visiongui/driver/launch_process.py b/src/visiongui/driver/launch_process.py
@@ -2,7 +2,7 @@
 import subprocess
 
 
-def launch_process(cmd: list[str]) -> subprocess.Popen:
+def launch_process(cmd: list[str]) -> subprocess.Popen[bytes]:
     if not cmd:
         raise ValueError("Command list must not be empty")
 

diff --git a/src/visiongui/driver/save_debug_screenshot.py b/src/visiongui/driver/save_debug_screenshot.py
@@ -15,7 +15,7 @@ def save_debug_screenshot(
     image_file_name_prefix: FileNamePrefix,
     log_image_name: str,
     debug_output_base_path: str,
-):
+) -> None:
     file_binary = take_screenshot()
     file_name = f"{image_file_name_prefix.value}_{int(time.time())}_{os.path.basename(log_image_name)}.png"
     save_file(

diff --git a/src/visiongui/driver/switch_to.py b/src/visiongui/driver/switch_to.py
@@ -4,8 +4,13 @@
 
 
 def _set_foreground_hwnd(hwnd: int) -> None:
-    user32 = ctypes.WinDLL("user32", use_last_error=True)
-    kernel32 = ctypes.WinDLL("kernel32", use_last_error=True)
+    if platform.system() != "Windows":
+        raise RuntimeError("This function is only supported on Windows")
+
+    # ctypes.WinDLL only exists in the Windows stubs: "attr-defined" silences
+    # mypy elsewhere, "unused-ignore" keeps strict mode quiet on Windows.
+    user32 = ctypes.WinDLL("user32", use_last_error=True)  # type: ignore[attr-defined, unused-ignore]
+    kernel32 = ctypes.WinDLL("kernel32", use_last_error=True)  # type: ignore[attr-defined, unused-ignore]
     GetForegroundWindow = user32.GetForegroundWindow
     GetWindowThreadProcessId = user32.GetWindowThreadProcessId
     GetCurrentThreadId = kernel32.GetCurrentThreadId

diff --git a/src/visiongui/driver/wait.py b/src/visiongui/driver/wait.py
@@ -1,18 +1,21 @@
 import time
 from collections.abc import Callable
+from typing import TypeVar
 
 from visiongui.driver.exception import ExceptionTimeout
 
+T = TypeVar("T")
+
 
 class WebDriverWait:
-    def __init__(self, timeout: float, poll_frequency: float = 0.1):
+    def __init__(self, timeout: int, poll_frequency: float = 0.1):
         self.timeout = timeout
         self.poll_frequency = poll_frequency
 
     def until(
         self,
-        condition: Callable[[], object],
-    ):
+        condition: Callable[[], T],
+    ) -> T:
         end_time = time.time() + self.timeout
         while True:
             try:

diff --git a/src/visiongui/driver/wait_for_window_to_disappear.py b/src/visiongui/driver/wait_for_window_to_disappear.py
@@ -11,8 +11,8 @@
 
 
 def wait_for_window_to_disappear(
-    title: re.Pattern,
-    timeout: float,
+    title: re.Pattern[str],
+    timeout: int,
 ) -> None:
     def _window_check() -> bool:
         return _get_matching_window(title) is None