Remove VisionBridge OCR (unused)

VisionBridge was a Swift library for Apple Vision OCR that was built on every compile but never actually used by any g3 tool. Removed: the vision-bridge/ Swift package directory; the src/ocr/ module (vision.rs, tesseract.rs, mod.rs); the OCR methods from the ComputerController trait; OCR-related code from the platform implementations; the TextLocation type (no longer needed); and the test_vision.rs example. Simplified: build.rs (now empty, no Swift compilation); MacOSController (no longer holds an OCR engine); LinuxController and WindowsController (now stub implementations). Build time improvement: no more 'Building VisionBridge Swift package...' messages on every compile.
2026-01-21 06:42:01 +05:30
parent 38b0019ad4
commit a89cad955a
13 changed files with 22 additions and 1292 deletions
--- a/crates/g3-computer-control/src/platform/linux.rs
+++ b/crates/g3-computer-control/src/platform/linux.rs
@@ -1,188 +1,32 @@
-use crate::{types::*, ComputerController};
+use crate::{types::Rect, ComputerController};
 use anyhow::Result;
 use async_trait::async_trait;
-use tesseract::Tesseract;
-use uuid::Uuid;

-pub struct LinuxController {
-    // Placeholder for X11 connection or other state
-}
+pub struct LinuxController;

 impl LinuxController {
    pub fn new() -> Result<Self> {
-        // Initialize X11 connection
        tracing::warn!("Linux computer control not fully implemented");
-        Ok(Self {})
+        Ok(Self)
    }
 }

 #[async_trait]
 impl ComputerController for LinuxController {
-    async fn move_mouse(&self, _x: i32, _y: i32) -> Result<()> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn click(&self, _button: MouseButton) -> Result<()> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn double_click(&self, _button: MouseButton) -> Result<()> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn type_text(&self, _text: &str) -> Result<()> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn press_key(&self, _key: &str) -> Result<()> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn list_windows(&self) -> Result<Vec<Window>> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn focus_window(&self, _window_id: &str) -> Result<()> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn get_window_bounds(&self, _window_id: &str) -> Result<Rect> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn find_element(&self, _selector: &ElementSelector) -> Result<Option<UIElement>> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn get_element_text(&self, _element_id: &str) -> Result<String> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
-    async fn get_element_bounds(&self, _element_id: &str) -> Result<Rect> {
-        anyhow::bail!("Linux implementation not yet available")
-    }
-
    async fn take_screenshot(
        &self,
        _path: &str,
        _region: Option<Rect>,
        _window_id: Option<&str>,
    ) -> Result<()> {
-        // Enforce that window_id must be provided
-        if _window_id.is_none() {
-            anyhow::bail!("window_id is required. You must specify which window to capture (e.g., 'Firefox', 'Terminal', 'gedit'). Use list_windows to see available windows.");
-        }
-
-        anyhow::bail!("Linux implementation not yet available")
+        anyhow::bail!("Linux screenshot implementation not yet available")
    }

-    async fn extract_text_from_screen(&self, _region: Rect, _window_id: &str) -> Result<String> {
-        anyhow::bail!("Linux implementation not yet available")
+    fn move_mouse(&self, _x: i32, _y: i32) -> Result<()> {
+        anyhow::bail!("Linux mouse control not yet available")
    }

-    async fn extract_text_from_image(&self, _path: &str) -> Result<OCRResult> {
-        // Check if tesseract is available on the system
-        let tesseract_check = std::process::Command::new("which")
-            .arg("tesseract")
-            .output();
-
-        if tesseract_check.is_err() || !tesseract_check.as_ref().unwrap().status.success() {
-            anyhow::bail!(
-                "Tesseract OCR is not installed on your system.\n\n\
-                To install tesseract:\n  \
-                Ubuntu/Debian: sudo apt-get install tesseract-ocr\n  \
-                RHEL/CentOS:   sudo yum install tesseract\n  \
-                Arch Linux:    sudo pacman -S tesseract\n\n\
-                After installation, restart your terminal and try again."
-            );
-        }
-
-        // Initialize Tesseract
-        let tess = Tesseract::new(None, Some("eng")).map_err(|e| {
-            anyhow::anyhow!(
-                "Failed to initialize Tesseract: {}\n\n\
-                    This usually means:\n1. Tesseract is not properly installed\n\
-                    2. Language data files are missing\n\nTo fix:\n  \
-                    Ubuntu/Debian: sudo apt-get install tesseract-ocr-eng\n  \
-                    RHEL/CentOS:   sudo yum install tesseract-langpack-eng\n  \
-                    Arch Linux:    sudo pacman -S tesseract-data-eng",
-                e
-            )
-        })?;
-
-        let text = tess
-            .set_image(_path)
-            .map_err(|e| anyhow::anyhow!("Failed to load image '{}': {}", _path, e))?
-            .get_text()
-            .map_err(|e| anyhow::anyhow!("Failed to extract text from image: {}", e))?;
-
-        // Get confidence (simplified - would need more complex API calls for per-word confidence)
-        let confidence = 0.85; // Placeholder
-
-        Ok(OCRResult {
-            text,
-            confidence,
-            bounds: Rect {
-                x: 0,
-                y: 0,
-                width: 0,
-                height: 0,
-            }, // Would need image dimensions
-        })
-    }
-
-    async fn find_text_on_screen(&self, _text: &str) -> Result<Option<Point>> {
-        // Check if tesseract is available on the system
-        let tesseract_check = std::process::Command::new("which")
-            .arg("tesseract")
-            .output();
-
-        if tesseract_check.is_err() || !tesseract_check.as_ref().unwrap().status.success() {
-            anyhow::bail!(
-                "Tesseract OCR is not installed on your system.\n\n\
-                To install tesseract:\n  \
-                Ubuntu/Debian: sudo apt-get install tesseract-ocr\n  \
-                RHEL/CentOS:   sudo yum install tesseract\n  \
-                Arch Linux:    sudo pacman -S tesseract\n\n\
-                After installation, restart your terminal and try again."
-            );
-        }
-
-        // Take full screen screenshot
-        let temp_path = format!("/tmp/g3_ocr_search_{}.png", uuid::Uuid::new_v4());
-        self.take_screenshot(&temp_path, None, None).await?;
-
-        // Use Tesseract to find text with bounding boxes
-        let tess = Tesseract::new(None, Some("eng")).map_err(|e| {
-            anyhow::anyhow!(
-                "Failed to initialize Tesseract: {}\n\n\
-                    This usually means:\n1. Tesseract is not properly installed\n\
-                    2. Language data files are missing\n\nTo fix:\n  \
-                    Ubuntu/Debian: sudo apt-get install tesseract-ocr-eng\n  \
-                    RHEL/CentOS:   sudo yum install tesseract-langpack-eng\n  \
-                    Arch Linux:    sudo pacman -S tesseract-data-eng",
-                e
-            )
-        })?;
-
-        let full_text = tess
-            .set_image(temp_path.as_str())
-            .map_err(|e| anyhow::anyhow!("Failed to load screenshot: {}", e))?
-            .get_text()
-            .map_err(|e| anyhow::anyhow!("Failed to extract text from screen: {}", e))?;
-
-        // Clean up temp file
-        let _ = std::fs::remove_file(&temp_path);
-
-        // Simple text search - full implementation would use get_component_images
-        // to get bounding boxes for each word
-        if full_text.contains(_text) {
-            tracing::warn!(
-                "Text found but precise coordinates not available in simplified implementation"
-            );
-            Ok(Some(Point { x: 0, y: 0 }))
-        } else {
-            Ok(None)
-        }
+    fn click_at(&self, _x: i32, _y: i32, _app_name: Option<&str>) -> Result<()> {
+        anyhow::bail!("Linux click control not yet available")
    }
 }
--- a/crates/g3-computer-control/src/platform/macos.rs
+++ b/crates/g3-computer-control/src/platform/macos.rs
@@ -1,7 +1,5 @@
-use crate::ocr::{DefaultOCR, OCREngine};
 use crate::{
-    types::{Rect, TextLocation},
-    ComputerController,
+    types::Rect, ComputerController,
 };
 use anyhow::{Context, Result};
 use async_trait::async_trait;
@@ -14,21 +12,12 @@ use core_graphics::window::{
 };
 use std::path::Path;

-pub struct MacOSController {
-    ocr_engine: Box<dyn OCREngine>,
-    #[allow(dead_code)]
-    ocr_name: String,
-}
+pub struct MacOSController;

 impl MacOSController {
    pub fn new() -> Result<Self> {
-        let ocr = Box::new(DefaultOCR::new()?);
-        let ocr_name = ocr.name().to_string();
-        tracing::debug!("Initialized macOS controller with OCR engine: {}", ocr_name);
-        Ok(Self {
-            ocr_engine: ocr,
-            ocr_name,
-        })
+        tracing::debug!("Initialized macOS controller");
+        Ok(Self)
    }
 }

@@ -215,78 +204,6 @@ impl ComputerController for MacOSController {
        Ok(())
    }

-    async fn extract_text_from_screen(&self, region: Rect, window_id: &str) -> Result<String> {
-        // Take screenshot of region first
-        let temp_path = format!("/tmp/g3_ocr_{}.png", uuid::Uuid::new_v4());
-        self.take_screenshot(&temp_path, Some(region), Some(window_id))
-            .await?;
-
-        // Extract text from the screenshot
-        let result = self.extract_text_from_image(&temp_path).await?;
-
-        // Clean up temp file
-        let _ = std::fs::remove_file(&temp_path);
-
-        Ok(result)
-    }
-
-    async fn extract_text_from_image(&self, path: &str) -> Result<String> {
-        // Extract all text and concatenate
-        let locations = self.ocr_engine.extract_text_with_locations(path).await?;
-        Ok(locations
-            .iter()
-            .map(|loc| loc.text.as_str())
-            .collect::<Vec<_>>()
-            .join(" "))
-    }
-
-    async fn extract_text_with_locations(&self, path: &str) -> Result<Vec<TextLocation>> {
-        // Use the OCR engine
-        self.ocr_engine.extract_text_with_locations(path).await
-    }
-
-    async fn find_text_in_app(
-        &self,
-        app_name: &str,
-        search_text: &str,
-    ) -> Result<Option<TextLocation>> {
-        // Take screenshot of specific app window
-        let home = std::env::var("HOME").unwrap_or_else(|_| "/tmp".to_string());
-        let temp_path = format!(
-            "{}/tmp/g3_find_text_{}_{}.png",
-            home,
-            app_name,
-            uuid::Uuid::new_v4()
-        );
-        self.take_screenshot(&temp_path, None, Some(app_name))
-            .await?;
-
-        // Get screenshot dimensions before we delete it
-        let screenshot_dims = get_image_dimensions(&temp_path)?;
-
-        // Extract all text with locations
-        let locations = self.extract_text_with_locations(&temp_path).await?;
-
-        // Get window bounds to calculate coordinate transformation
-        let window_bounds = self.get_window_bounds(app_name)?;
-
-        // Clean up temp file
-        let _ = std::fs::remove_file(&temp_path);
-
-        // Find matching text (case-insensitive)
-        let search_lower = search_text.to_lowercase();
-        for location in locations {
-            if location.text.to_lowercase().contains(&search_lower) {
-                // Transform coordinates from screenshot space to screen space
-                let transformed =
-                    transform_screenshot_to_screen_coords(location, window_bounds, screenshot_dims);
-                return Ok(Some(transformed));
-            }
-        }
-
-        Ok(None)
-    }
-
    fn move_mouse(&self, x: i32, y: i32) -> Result<()> {
        use core_graphics::event::{CGEvent, CGEventTapLocation, CGEventType, CGMouseButton};
        use core_graphics::event_source::{CGEventSource, CGEventSourceStateID};
@@ -379,246 +296,6 @@ impl ComputerController for MacOSController {
    }
 }

-impl MacOSController {
-    /// Get window bounds for an application (helper method)
-    fn get_window_bounds(&self, app_name: &str) -> Result<(i32, i32, i32, i32)> {
-        unsafe {
-            let window_list =
-                CGWindowListCopyWindowInfo(kCGWindowListOptionOnScreenOnly, kCGNullWindowID);
-
-            let array = CFArray::<CFDictionary>::wrap_under_create_rule(window_list);
-            let count = array.len();
-
-            let app_name_lower = app_name.to_lowercase();
-
-            for i in 0..count {
-                let dict = array.get(i).unwrap();
-
-                // Get owner name
-                let owner_key = CFString::from_static_string("kCGWindowOwnerName");
-                let owner: String = if let Some(value) = dict.find(owner_key.to_void()) {
-                    let s: CFString = TCFType::wrap_under_get_rule(*value as *const _);
-                    s.to_string()
-                } else {
-                    continue;
-                };
-
-                let owner_lower = owner.to_lowercase();
-
-                // Normalize by removing spaces for exact matching
-                let app_name_normalized = app_name_lower.replace(" ", "");
-                let owner_normalized = owner_lower.replace(" ", "");
-
-                // ONLY accept exact matches (case-insensitive, with or without spaces)
-                // This prevents "Goose" from matching "GooseStudio"
-                let is_match =
-                    owner_lower == app_name_lower || owner_normalized == app_name_normalized;
-
-                if is_match {
-                    // Get window layer to filter out menu bar windows
-                    let layer_key = CFString::from_static_string("kCGWindowLayer");
-                    let layer: i32 = if let Some(value) = dict.find(layer_key.to_void()) {
-                        let num: core_foundation::number::CFNumber =
-                            TCFType::wrap_under_get_rule(*value as *const _);
-                        num.to_i32().unwrap_or(0)
-                    } else {
-                        0
-                    };
-
-                    // Skip menu bar windows (layer >= 20)
-                    if layer >= 20 {
-                        tracing::debug!(
-                            "Skipping window for '{}' at layer {} (menu bar)",
-                            owner,
-                            layer
-                        );
-                        continue;
-                    }
-
-                    // Get window bounds to verify it's a real window
-                    let bounds_key = CFString::from_static_string("kCGWindowBounds");
-                    if let Some(value) = dict.find(bounds_key.to_void()) {
-                        let bounds_dict: CFDictionary =
-                            TCFType::wrap_under_get_rule(*value as *const _);
-
-                        let x_key = CFString::from_static_string("X");
-                        let y_key = CFString::from_static_string("Y");
-                        let width_key = CFString::from_static_string("Width");
-                        let height_key = CFString::from_static_string("Height");
-
-                        if let (Some(x_val), Some(y_val), Some(w_val), Some(h_val)) = (
-                            bounds_dict.find(x_key.to_void()),
-                            bounds_dict.find(y_key.to_void()),
-                            bounds_dict.find(width_key.to_void()),
-                            bounds_dict.find(height_key.to_void()),
-                        ) {
-                            let x_num: core_foundation::number::CFNumber =
-                                TCFType::wrap_under_get_rule(*x_val as *const _);
-                            let y_num: core_foundation::number::CFNumber =
-                                TCFType::wrap_under_get_rule(*y_val as *const _);
-                            let w_num: core_foundation::number::CFNumber =
-                                TCFType::wrap_under_get_rule(*w_val as *const _);
-                            let h_num: core_foundation::number::CFNumber =
-                                TCFType::wrap_under_get_rule(*h_val as *const _);
-
-                            let x: i32 = x_num.to_i64().unwrap_or(0) as i32;
-                            let y: i32 = y_num.to_i64().unwrap_or(0) as i32;
-                            let w: i32 = w_num.to_i64().unwrap_or(0) as i32;
-                            let h: i32 = h_num.to_i64().unwrap_or(0) as i32;
-
-                            // Only accept windows with real bounds (>= 100x100 pixels)
-                            if w >= 100 && h >= 100 {
-                                tracing::debug!("Found valid window bounds for '{}': x={}, y={}, w={}, h={} (layer={})", owner, x, y, w, h, layer);
-                                return Ok((x, y, w, h));
-                            } else {
-                                tracing::debug!(
-                                    "Skipping window for '{}': too small ({}x{})",
-                                    owner,
-                                    w,
-                                    h
-                                );
-                                continue;
-                            }
-                        } else {
-                            continue;
-                        }
-                    }
-                }
-            }
-        }
-
-        Err(anyhow::anyhow!(
-            "Could not find window bounds for '{}'",
-            app_name
-        ))
-    }
-}
-
-/// Get image dimensions from a PNG file
-fn get_image_dimensions(path: &str) -> Result<(i32, i32)> {
-    use std::fs::File;
-    use std::io::Read;
-
-    let mut file = File::open(path)?;
-    let mut buffer = vec![0u8; 24];
-    file.read_exact(&mut buffer)?;
-
-    // PNG signature check
-    if &buffer[0..8] != b"\x89PNG\r\n\x1a\n" {
-        anyhow::bail!("Not a valid PNG file");
-    }
-
-    // Read IHDR chunk (width and height are at bytes 16-23)
-    let width = u32::from_be_bytes([buffer[16], buffer[17], buffer[18], buffer[19]]) as i32;
-    let height = u32::from_be_bytes([buffer[20], buffer[21], buffer[22], buffer[23]]) as i32;
-
-    Ok((width, height))
-}
-
-/// Transform coordinates from screenshot space to screen space
-///
-/// The screenshot is taken of a window, and Vision OCR returns coordinates
-/// relative to the screenshot image. We need to transform these to actual
-/// screen coordinates for clicking.
-///
-/// On Retina displays, screenshots are taken at 2x resolution, so we need
-/// to account for this scaling factor.
-fn transform_screenshot_to_screen_coords(
-    location: TextLocation,
-    window_bounds: (i32, i32, i32, i32), // (x, y, width, height) in screen space
-    screenshot_dims: (i32, i32),         // (width, height) in pixels
-) -> TextLocation {
-    let (win_x, win_y, win_width, win_height) = window_bounds;
-    let (screenshot_width, screenshot_height) = screenshot_dims;
-
-    // Calculate scale factors
-    // On Retina displays, screenshot is typically 2x the window size
-    let scale_x = win_width as f64 / screenshot_width as f64;
-    let scale_y = win_height as f64 / screenshot_height as f64;
-
-    tracing::debug!(
-        "Transform: screenshot={}x{}, window={}x{} at ({},{}), scale=({:.2},{:.2})",
-        screenshot_width,
-        screenshot_height,
-        win_width,
-        win_height,
-        win_x,
-        win_y,
-        scale_x,
-        scale_y
-    );
-
-    // Transform coordinates from image space to screen space
-    // IMPORTANT: macOS screen coordinates have origin at BOTTOM-LEFT (Y increases upward)
-    // Image coordinates have origin at TOP-LEFT (Y increases downward)
-    // win_y is the BOTTOM of the window in screen coordinates
-    // So we need to: (win_y + win_height) to get window TOP, then subtract screenshot_y
-    let window_top_y = win_y + win_height;
-
-    tracing::debug!(
-        "[transform] Input location in image space: x={}, y={}, width={}, height={}",
-        location.x,
-        location.y,
-        location.width,
-        location.height
-    );
-    tracing::debug!(
-        "[transform] Scale factors: scale_x={:.4}, scale_y={:.4}",
-        scale_x,
-        scale_y
-    );
-
-    let transformed_x = win_x + (location.x as f64 * scale_x) as i32;
-    let transformed_y = window_top_y - (location.y as f64 * scale_y) as i32;
-    let transformed_width = (location.width as f64 * scale_x) as i32;
-    let transformed_height = (location.height as f64 * scale_y) as i32;
-
-    tracing::debug!("[transform] Calculation details:");
-    tracing::debug!(
-        "  - transformed_x = {} + ({} * {:.4}) = {} + {:.2} = {}",
-        win_x,
-        location.x,
-        scale_x,
-        win_x,
-        location.x as f64 * scale_x,
-        transformed_x
-    );
-    tracing::debug!(
-        "  - transformed_width = ({} * {:.4}) = {:.2} -> {}",
-        location.width,
-        scale_x,
-        location.width as f64 * scale_x,
-        transformed_width
-    );
-    tracing::debug!(
-        "  - transformed_height = ({} * {:.4}) = {:.2} -> {}",
-        location.height,
-        scale_y,
-        location.height as f64 * scale_y,
-        transformed_height
-    );
-
-    tracing::debug!(
-        "Transformed location: screenshot=({},{}) {}x{} -> screen=({},{}) {}x{}",
-        location.x,
-        location.y,
-        location.width,
-        location.height,
-        transformed_x,
-        transformed_y,
-        transformed_width,
-        transformed_height
-    );
-
-    TextLocation {
-        text: location.text,
-        x: transformed_x,
-        y: transformed_y,
-        width: transformed_width,
-        height: transformed_height,
-        confidence: location.confidence,
-    }
-}

 #[path = "macos_window_matching_test.rs"]
 #[cfg(test)]
--- a/crates/g3-computer-control/src/platform/windows.rs
+++ b/crates/g3-computer-control/src/platform/windows.rs
@@ -1,189 +1,32 @@
-use crate::{types::*, ComputerController};
+use crate::{types::Rect, ComputerController};
 use anyhow::Result;
 use async_trait::async_trait;
-use tesseract::Tesseract;
-use uuid::Uuid;

-pub struct WindowsController {
-    // Placeholder for Windows-specific state
-}
+pub struct WindowsController;

 impl WindowsController {
    pub fn new() -> Result<Self> {
        tracing::warn!("Windows computer control not fully implemented");
-        Ok(Self {})
+        Ok(Self)
    }
 }

 #[async_trait]
 impl ComputerController for WindowsController {
-    async fn move_mouse(&self, _x: i32, _y: i32) -> Result<()> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn click(&self, _button: MouseButton) -> Result<()> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn double_click(&self, _button: MouseButton) -> Result<()> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn type_text(&self, _text: &str) -> Result<()> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn press_key(&self, _key: &str) -> Result<()> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn list_windows(&self) -> Result<Vec<Window>> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn focus_window(&self, _window_id: &str) -> Result<()> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn get_window_bounds(&self, _window_id: &str) -> Result<Rect> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn find_element(&self, _selector: &ElementSelector) -> Result<Option<UIElement>> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn get_element_text(&self, _element_id: &str) -> Result<String> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
-    async fn get_element_bounds(&self, _element_id: &str) -> Result<Rect> {
-        anyhow::bail!("Windows implementation not yet available")
-    }
-
    async fn take_screenshot(
        &self,
        _path: &str,
        _region: Option<Rect>,
        _window_id: Option<&str>,
    ) -> Result<()> {
-        // Enforce that window_id must be provided
-        if _window_id.is_none() {
-            anyhow::bail!("window_id is required. You must specify which window to capture (e.g., 'Chrome', 'Terminal', 'Notepad'). Use list_windows to see available windows.");
-        }
-
-        anyhow::bail!("Windows implementation not yet available")
+        anyhow::bail!("Windows screenshot implementation not yet available")
    }

-    async fn extract_text_from_screen(&self, _region: Rect, _window_id: &str) -> Result<String> {
-        anyhow::bail!("Windows implementation not yet available")
+    fn move_mouse(&self, _x: i32, _y: i32) -> Result<()> {
+        anyhow::bail!("Windows mouse control not yet available")
    }

-    async fn extract_text_from_image(&self, _path: &str) -> Result<OCRResult> {
-        // Check if tesseract is available on the system
-        let tesseract_check = std::process::Command::new("where")
-            .arg("tesseract")
-            .output();
-
-        if tesseract_check.is_err() || !tesseract_check.as_ref().unwrap().status.success() {
-            anyhow::bail!(
-                "Tesseract OCR is not installed on your system.\n\n\
-                To install tesseract on Windows:\n  \
-                1. Download the installer from: https://github.com/UB-Mannheim/tesseract/wiki\n  \
-                2. Run the installer and follow the instructions\n  \
-                3. Add tesseract to your PATH environment variable\n  \
-                4. Restart your terminal/command prompt\n\n\
-                After installation, restart your terminal and try again."
-            );
-        }
-
-        // Initialize Tesseract
-        let tess = Tesseract::new(None, Some("eng")).map_err(|e| {
-            anyhow::anyhow!(
-                "Failed to initialize Tesseract: {}\n\n\
-                    This usually means:\n1. Tesseract is not properly installed\n\
-                    2. Language data files are missing\n\nTo fix:\n  \
-                    1. Reinstall tesseract from https://github.com/UB-Mannheim/tesseract/wiki\n  \
-                    2. Make sure to select 'Additional language data' during installation\n  \
-                    3. Ensure tesseract is in your PATH",
-                e
-            )
-        })?;
-
-        let text = tess
-            .set_image(_path)
-            .map_err(|e| anyhow::anyhow!("Failed to load image '{}': {}", _path, e))?
-            .get_text()
-            .map_err(|e| anyhow::anyhow!("Failed to extract text from image: {}", e))?;
-
-        // Get confidence (simplified - would need more complex API calls for per-word confidence)
-        let confidence = 0.85; // Placeholder
-
-        Ok(OCRResult {
-            text,
-            confidence,
-            bounds: Rect {
-                x: 0,
-                y: 0,
-                width: 0,
-                height: 0,
-            }, // Would need image dimensions
-        })
-    }
-
-    async fn find_text_on_screen(&self, _text: &str) -> Result<Option<Point>> {
-        // Check if tesseract is available on the system
-        let tesseract_check = std::process::Command::new("where")
-            .arg("tesseract")
-            .output();
-
-        if tesseract_check.is_err() || !tesseract_check.as_ref().unwrap().status.success() {
-            anyhow::bail!(
-                "Tesseract OCR is not installed on your system.\n\n\
-                To install tesseract on Windows:\n  \
-                1. Download the installer from: https://github.com/UB-Mannheim/tesseract/wiki\n  \
-                2. Run the installer and follow the instructions\n  \
-                3. Add tesseract to your PATH environment variable\n  \
-                4. Restart your terminal/command prompt\n\n\
-                After installation, restart your terminal and try again."
-            );
-        }
-
-        // Take full screen screenshot
-        let temp_path = format!("C:\\\\Temp\\\\g3_ocr_search_{}.png", uuid::Uuid::new_v4());
-        self.take_screenshot(&temp_path, None, None).await?;
-
-        // Use Tesseract to find text with bounding boxes
-        let tess = Tesseract::new(None, Some("eng")).map_err(|e| {
-            anyhow::anyhow!(
-                "Failed to initialize Tesseract: {}\n\n\
-                    This usually means:\n1. Tesseract is not properly installed\n\
-                    2. Language data files are missing\n\nTo fix:\n  \
-                    1. Reinstall tesseract from https://github.com/UB-Mannheim/tesseract/wiki\n  \
-                    2. Make sure to select 'Additional language data' during installation\n  \
-                    3. Ensure tesseract is in your PATH",
-                e
-            )
-        })?;
-
-        let full_text = tess
-            .set_image(temp_path.as_str())
-            .map_err(|e| anyhow::anyhow!("Failed to load screenshot: {}", e))?
-            .get_text()
-            .map_err(|e| anyhow::anyhow!("Failed to extract text from screen: {}", e))?;
-
-        // Clean up temp file
-        let _ = std::fs::remove_file(&temp_path);
-
-        // Simple text search - full implementation would use get_component_images
-        // to get bounding boxes for each word
-        if full_text.contains(_text) {
-            tracing::warn!(
-                "Text found but precise coordinates not available in simplified implementation"
-            );
-            Ok(Some(Point { x: 0, y: 0 }))
-        } else {
-            Ok(None)
-        }
+    fn click_at(&self, _x: i32, _y: i32, _app_name: Option<&str>) -> Result<()> {
+        anyhow::bail!("Windows click control not yet available")
    }
 }