Initial commit: GSPro Remote MVP - Phase 1 complete

2025-11-13 15:38:58 -06:00 · 2025-11-13 15:38:58 -06:00 · 74ca4b38eb
commit 74ca4b38eb
50 changed files with 12818 additions and 0 deletions
--- a/backend/app/core/screen.py
+++ b/backend/app/core/screen.py
@ -0,0 +1,370 @@
+"""
+Screen capture utilities for GSPro Remote.
+"""
+
+import logging
+from typing import Optional, Tuple, Dict, Any
+from io import BytesIO
+import base64
+
+try:
+    import mss
+    import mss.tools
+    from PIL import Image
+    import cv2
+    import numpy as np
+except ImportError as e:
+    raise ImportError(f"Required screen capture dependencies not installed: {e}")
+
+logger = logging.getLogger(__name__)
+
+
+class ScreenCapture:
+    """Manages screen capture operations."""
+
+    def __init__(self):
+        """Initialize screen capture manager."""
+        self.sct = mss.mss()
+        self._monitor_info = None
+
+    def get_monitors(self) -> list[dict]:
+        """
+        Get information about all available monitors.
+
+        Returns:
+            List of monitor information dictionaries
+        """
+        monitors = []
+        for i, monitor in enumerate(self.sct.monitors):
+            monitors.append(
+                {
+                    "index": i,
+                    "left": monitor["left"],
+                    "top": monitor["top"],
+                    "width": monitor["width"],
+                    "height": monitor["height"],
+                    "is_primary": i == 0,  # Index 0 is combined virtual screen
+                }
+            )
+        return monitors
+
+    def get_primary_monitor(self) -> dict:
+        """
+        Get the primary monitor information.
+
+        Returns:
+            Primary monitor information
+        """
+        # Index 1 is typically the primary monitor in mss
+        return self.sct.monitors[1] if len(self.sct.monitors) > 1 else self.sct.monitors[0]
+
+    def capture_screen(self, monitor_index: int = 1) -> np.ndarray:
+        """
+        Capture the entire screen.
+
+        Args:
+            monitor_index: Index of the monitor to capture (0 for all, 1 for primary)
+
+        Returns:
+            Captured screen as numpy array (BGR format)
+        """
+        try:
+            monitor = self.sct.monitors[monitor_index]
+            screenshot = self.sct.grab(monitor)
+
+            # Convert to numpy array (BGR format for OpenCV compatibility)
+            img = np.array(screenshot)
+            img = cv2.cvtColor(img, cv2.COLOR_RGBA2BGR)
+
+            return img
+        except Exception as e:
+            logger.error(f"Failed to capture screen: {e}")
+            raise
+
+    def capture_region(self, x: int, y: int, width: int, height: int, monitor_index: int = 1) -> np.ndarray:
+        """
+        Capture a specific region of the screen.
+
+        Args:
+            x: X coordinate of the region (relative to monitor)
+            y: Y coordinate of the region (relative to monitor)
+            width: Width of the region
+            height: Height of the region
+            monitor_index: Index of the monitor to capture from
+
+        Returns:
+            Captured region as numpy array (BGR format)
+        """
+        try:
+            monitor = self.sct.monitors[monitor_index]
+
+            # Define region to capture
+            region = {
+                "left": monitor["left"] + x,
+                "top": monitor["top"] + y,
+                "width": width,
+                "height": height,
+            }
+
+            screenshot = self.sct.grab(region)
+
+            # Convert to numpy array
+            img = np.array(screenshot)
+            img = cv2.cvtColor(img, cv2.COLOR_RGBA2BGR)
+
+            return img
+        except Exception as e:
+            logger.error(f"Failed to capture region: {e}")
+            raise
+
+    def capture_window(self, window_title: str) -> Optional[np.ndarray]:
+        """
+        Capture a specific window by title.
+
+        Args:
+            window_title: Title of the window to capture
+
+        Returns:
+            Captured window as numpy array or None if window not found
+        """
+        try:
+            import win32gui
+
+            def enum_window_callback(hwnd, windows):
+                if win32gui.IsWindowVisible(hwnd) and win32gui.IsWindowEnabled(hwnd):
+                    window_text = win32gui.GetWindowText(hwnd)
+                    if window_title.lower() in window_text.lower():
+                        windows.append(hwnd)
+                return True
+
+            windows = []
+            win32gui.EnumWindows(enum_window_callback, windows)
+
+            if not windows:
+                logger.warning(f"Window not found: {window_title}")
+                return None
+
+            # Get window rectangle
+            hwnd = windows[0]
+            rect = win32gui.GetWindowRect(hwnd)
+            x, y, x2, y2 = rect
+            width = x2 - x
+            height = y2 - y
+
+            # Capture the window region
+            return self.capture_region(x, y, width, height, monitor_index=0)
+
+        except Exception as e:
+            logger.error(f"Failed to capture window: {e}")
+            return None
+
+    def image_to_base64(self, image: np.ndarray, quality: int = 85, format: str = "JPEG") -> str:
+        """
+        Convert an image array to base64 string.
+
+        Args:
+            image: Image as numpy array (BGR format)
+            quality: JPEG quality (1-100)
+            format: Image format (JPEG, PNG)
+
+        Returns:
+            Base64 encoded image string
+        """
+        try:
+            # Convert BGR to RGB for PIL
+            rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+            pil_image = Image.fromarray(rgb_image)
+
+            # Save to bytes
+            buffer = BytesIO()
+            if format.upper() == "JPEG":
+                pil_image.save(buffer, format=format, quality=quality, optimize=True)
+            else:
+                pil_image.save(buffer, format=format)
+
+            # Encode to base64
+            buffer.seek(0)
+            base64_string = base64.b64encode(buffer.getvalue()).decode("utf-8")
+
+            return base64_string
+        except Exception as e:
+            logger.error(f"Failed to convert image to base64: {e}")
+            raise
+
+    def resize_image(self, image: np.ndarray, width: Optional[int] = None, height: Optional[int] = None) -> np.ndarray:
+        """
+        Resize an image while maintaining aspect ratio.
+
+        Args:
+            image: Image as numpy array
+            width: Target width (None to calculate from height)
+            height: Target height (None to calculate from width)
+
+        Returns:
+            Resized image as numpy array
+        """
+        try:
+            h, w = image.shape[:2]
+
+            if width and not height:
+                # Calculate height maintaining aspect ratio
+                height = int(h * (width / w))
+            elif height and not width:
+                # Calculate width maintaining aspect ratio
+                width = int(w * (height / h))
+            elif not width and not height:
+                # No resize needed
+                return image
+
+            return cv2.resize(image, (width, height), interpolation=cv2.INTER_AREA)
+        except Exception as e:
+            logger.error(f"Failed to resize image: {e}")
+            raise
+
+    def get_resolution_preset(self, preset: str) -> Tuple[int, int]:
+        """
+        Get width and height for a resolution preset.
+
+        Args:
+            preset: Resolution preset (e.g., '720p', '1080p', '480p')
+
+        Returns:
+            Tuple of (width, height)
+        """
+        presets = {
+            "480p": (854, 480),
+            "540p": (960, 540),
+            "720p": (1280, 720),
+            "900p": (1600, 900),
+            "1080p": (1920, 1080),
+            "1440p": (2560, 1440),
+            "2160p": (3840, 2160),
+            "4k": (3840, 2160),
+        }
+
+        return presets.get(preset.lower(), (1280, 720))
+
+    def close(self):
+        """Close the screen capture resources."""
+        if hasattr(self, "sct"):
+            self.sct.close()
+
+
+# Global screen capture instance
+_screen_capture: Optional[ScreenCapture] = None
+
+
+def get_screen_capture() -> ScreenCapture:
+    """
+    Get the global screen capture instance.
+
+    Returns:
+        ScreenCapture instance
+    """
+    global _screen_capture
+    if _screen_capture is None:
+        _screen_capture = ScreenCapture()
+    return _screen_capture
+
+
+def capture_screen(monitor_index: int = 1) -> np.ndarray:
+    """
+    Capture the entire screen.
+
+    Args:
+        monitor_index: Index of the monitor to capture
+
+    Returns:
+        Captured screen as numpy array
+    """
+    return get_screen_capture().capture_screen(monitor_index)
+
+
+def capture_region(x: int, y: int, width: int, height: int) -> np.ndarray:
+    """
+    Capture a specific region of the screen.
+
+    Args:
+        x: X coordinate of the region
+        y: Y coordinate of the region
+        width: Width of the region
+        height: Height of the region
+
+    Returns:
+        Captured region as numpy array
+    """
+    return get_screen_capture().capture_region(x, y, width, height)
+
+
+def get_screen_size() -> Tuple[int, int]:
+    """
+    Get the primary screen size.
+
+    Returns:
+        Tuple of (width, height)
+    """
+    monitor = get_screen_capture().get_primary_monitor()
+    return monitor["width"], monitor["height"]
+
+
+def capture_gspro_window(window_title: str = "GSPro") -> Optional[np.ndarray]:
+    """
+    Capture the GSPro window.
+
+    Args:
+        window_title: GSPro window title
+
+    Returns:
+        Captured window as numpy array or None if not found
+    """
+    return get_screen_capture().capture_window(window_title)
+
+
+# Test function for development
+def test_screen_capture():
+    """Test screen capture functionality."""
+    print("Testing screen capture...")
+
+    capture = ScreenCapture()
+
+    # Get monitor information
+    monitors = capture.get_monitors()
+    print(f"Found {len(monitors)} monitors:")
+    for monitor in monitors:
+        print(
+            f"  Monitor {monitor['index']}: {monitor['width']}x{monitor['height']} at ({monitor['left']}, {monitor['top']})"
+        )
+
+    # Capture primary screen
+    try:
+        screen = capture.capture_screen()
+        print(f"✓ Captured primary screen: {screen.shape}")
+    except Exception as e:
+        print(f"✗ Failed to capture screen: {e}")
+
+    # Test region capture
+    try:
+        region = capture.capture_region(100, 100, 640, 480)
+        print(f"✓ Captured region: {region.shape}")
+    except Exception as e:
+        print(f"✗ Failed to capture region: {e}")
+
+    # Test image to base64 conversion
+    try:
+        base64_str = capture.image_to_base64(region)
+        print(f"✓ Converted to base64: {len(base64_str)} chars")
+    except Exception as e:
+        print(f"✗ Failed to convert to base64: {e}")
+
+    # Test resolution presets
+    presets = ["480p", "720p", "1080p"]
+    for preset in presets:
+        width, height = capture.get_resolution_preset(preset)
+        print(f"  {preset}: {width}x{height}")
+
+    capture.close()
+    print("\nScreen capture test complete!")
+
+
+if __name__ == "__main__":
+    test_screen_capture()