plotly.rs/plotly_static/src/webdriver.rs at make-subplots · plotly/plotly.rs

669 lines (593 loc) · 24.5 KB
//! WebDriver management module for plotly_static.
//! This module provides WebDriver process management, including:
//! - Automatic detection of existing WebDriver sessions
//! - Process spawning and lifecycle management
//! - Connection reuse and cleanup
//! - Support for both spawned and external WebDriver instances
//! The module is designed to work safely in parallel environments.
use std::io::prelude::*;
use std::io::BufReader;
use std::path::PathBuf;
use std::process::{Child, Command, Stdio};
use std::sync::{Arc, Mutex};
use std::thread;
#[cfg(any(test, feature = "debug"))]
use std::{println as info, println as error, println as debug, println as warn, println as trace};
use anyhow::{anyhow, Result};
#[cfg(not(any(test, feature = "debug")))]
use log::{debug, error, info, trace, warn};
/// Environment variable for specifying the WebDriver binary path.
/// Read at runtime by `get_webdriver_path`; takes precedence over the
/// compile-time `WEBDRIVER_DOWNLOAD_PATH` value.
const WEBDRIVER_PATH_ENV: &str = "WEBDRIVER_PATH";
/// Name of the WebDriver binary when the `geckodriver` feature is enabled.
/// Used in log and error messages.
#[cfg(feature = "geckodriver")]
const WEBDRIVER_BIN: &str = "geckodriver";
/// Name of the WebDriver binary when the `chromedriver` feature is enabled.
/// Used in log and error messages.
#[cfg(feature = "chromedriver")]
const WEBDRIVER_BIN: &str = "chromedriver";
/// Default WebDriver port
pub(crate) const WEBDRIVER_PORT: u32 = 4444;
/// Default WebDriver base URL (scheme and host only); the port and the
/// `/status` path are appended where the URL is built.
pub(crate) const WEBDRIVER_URL: &str = "http://127.0.0.1";
#[cfg(all(feature = "chromedriver", not(target_os = "windows")))]
/// Returns the default Chrome command-line flags used on non-Windows
/// targets.
///
/// The flags are returned in a fixed order, starting with `--headless`.
pub(crate) fn chrome_default_caps() -> Vec<&'static str> {
    vec![
        "--headless",
        "--no-sandbox",
        "--disable-gpu-sandbox",
        "--disable-dev-shm-usage",
        "--disable-extensions",
        "--disable-background-networking",
        "--disable-sync",
        "--disable-translate",
        "--disable-background-timer-throttling",
        "--disable-renderer-backgrounding",
        "--disable-features=VizDisplayCompositor",
        "--memory-pressure-off",
        // macOS-specific flags from choreographer
        "--enable-unsafe-swiftshader",
        "--use-mock-keychain",
        "--password-store=basic",
        "--disable-web-security",
        "--disable-breakpad",
        "--no-first-run",
        "--no-default-browser-check",
        // Additional flags for better PDF generation support
        "--disable-backgrounding-occluded-windows",
        "--disable-ipc-flooding-protection",
        "--enable-logging",
        "--v=1",
    ]
}
#[cfg(all(feature = "chromedriver", target_os = "windows"))]
/// Returns the default Chrome command-line flags used on Windows targets.
///
/// The flags are returned in a fixed order, starting with `--headless=new`.
pub(crate) fn chrome_default_caps() -> Vec<&'static str> {
    vec![
        "--headless=new",
        "--no-sandbox",
        "--disable-dev-shm-usage",
        "--disable-breakpad",
        "--no-first-run",
        "--no-default-browser-check",
        // Stability flags to prevent renderer crashes
        "--disable-background-networking",
        "--disable-sync",
        "--disable-translate",
        "--disable-background-timer-throttling",
        "--disable-renderer-backgrounding",
        "--disable-backgrounding-occluded-windows",
        "--disable-ipc-flooding-protection",
        "--disable-extensions",
        // Minimal flags for Windows headless operation without disabling GPU
        "--hide-scrollbars",
        "--mute-audio",
        "--use-angle=swiftshader",
        "--disable-software-rasterizer",
    ]
}
#[cfg(feature = "geckodriver")]
/// Returns the default Firefox command-line flags.
pub(crate) fn firefox_default_caps() -> Vec<&'static str> {
    vec![
        "-headless",   // Essential for headless operation (single dash for Firefox)
        "--no-remote", // Prevents connecting to existing Firefox instances
    ]
}
/// Internal WebDriver state
#[derive(Debug)]
struct WdInner {
    /// Port the WebDriver listens on (or is expected to listen on).
    webdriver_port: u32,
    /// Path to the WebDriver binary; `None` for instances that only connect
    /// to an already running WebDriver.
    driver_path: Option<PathBuf>,
    /// Handle of the process spawned by this instance, if any.
    webdriver_child: Option<Child>,
    /// Marker for whether this WebDriver was spawned by us (`false`) or
    /// connected to an existing one (`true`).
    is_external: bool,
}
/// WebDriver management struct
/// This struct provides WebDriver process management with the following
/// features:
/// - Automatic detection of existing WebDriver sessions
/// - Process spawning and lifecycle management
/// - Connection reuse and cleanup
/// - Support for both spawned and external WebDriver instances
/// - Thread-safe operations using Arc<Mutex<>> for internal state
#[derive(Debug)]
pub struct WebDriver {
    inner: Arc<Mutex<WdInner>>,
impl WebDriver {
    /// Creates a new WebDriver instance for spawning.
    /// This method creates a WebDriver instance that will later spawn a new
    /// process. It looks for the WebDriver binary in the following order:
    /// 1. `WEBDRIVER_PATH` environment variable (should point to full
    ///    executable path)
    /// 2. Build-time downloaded path (if `webdriver_download` feature is
    ///    enabled)
    /// Returns a `Result<WebDriver>` where:
    /// - `Ok(webdriver)` - Successfully created the WebDriver instance
    /// - `Err(e)` - Failed to create the instance (e.g., binary not found)
    pub(crate) fn new(port: u32) -> Result<Self> {
        let full_path = Self::get_webdriver_path()?;
        Ok(Self {
            inner: Arc::new(Mutex::new(WdInner {
                webdriver_port: port,
                driver_path: Some(full_path),
                webdriver_child: None,
                is_external: false, // mark it as spawned by us
            })),
    /// Spawn a new WebDriver instance, connecting to existing if available.
    /// This method provides WebDriver management:
    /// 1. First checks if a WebDriver is already running on the specified port
    /// 2. If found, connects to the existing session
    /// 3. If not found, spawns a process of the current WebDriver instance
    /// This approach allows for efficient resource usage and supports both
    /// scenarios where WebDriver is managed externally or needs to be spawned.
    /// Returns a `Result<WebDriver>` where:
    /// - `Ok(webdriver)` - Successfully created or connected to WebDriver
    /// - `Err(e)` - Failed to create or connect to WebDriver
    pub(crate) fn connect_or_spawn(port: u32) -> Result<Self> {
        match Self::try_connect(port) {
            Some(active_instance) => Ok(active_instance),
            None => Self::spawn(port)
                .map_err(|e| anyhow!("Failed to spawn new WebDriver on port {}: {}", port, e)),
    /// Try connecting to an existing WebDriver instance
    pub(crate) fn try_connect(port: u32) -> Option<Self> {
        if !Self::is_webdriver_running(port) {
            return None;
        info!("WebDriver already running on port {port}, connecting to existing session");
        Self::no_spawn_instance(port).ok()
    /// Create a new WebDriver instance without a path to the webdriver binary,
    /// as it is used for connecting to an existing WebDriver session and not
    /// spawning a new process.
    pub(crate) fn no_spawn_instance(port: u32) -> Result<Self> {
        Ok(Self {
            inner: Arc::new(Mutex::new(WdInner {
                webdriver_port: port,
                driver_path: None,
                webdriver_child: None,
                is_external: true, // Mark as external since we didn't spawn it
            })),
    /// Spawns the WebDriver process
    /// This method starts the WebDriver process in a background thread and
    /// captures its output for logging. The process is spawned with the
    /// specified port and appropriate I/O redirection.
    /// The spawned process will be automatically managed and can be stopped
    /// using the `stop()` method.
    pub(crate) fn spawn(port: u32) -> Result<Self> {
        debug!("No WebDriver running on port {port}, creating new instance and spawning");
        let mut wd = Self::new(port)?;
        wd.spawn_webdriver()?;
        if Self::is_webdriver_running(port) {
            info!("Successfully created and started WebDriver on port {port}");
            Ok(wd)
        } else {
            let diagnostics = wd.get_diagnostics();
            error!(
                "WebDriver failed to start properly on port {port}. Diagnostics:\n{diagnostics}"
            Err(anyhow!(
                "WebDriver failed to start properly on port {}",
    pub(crate) fn spawn_webdriver(&mut self) -> Result<()> {
        let port = self.inner.lock().unwrap().webdriver_port;
        let driver_path = self.inner.lock().unwrap().driver_path.clone();
        info!("Spawning {WEBDRIVER_BIN} on port {port} with path: {driver_path:?}");
        if Self::is_webdriver_running(port) {
            warn!("WebDriver already running on port {port}, attempting to connect instead");
            return Ok(());
        self.validate_spawn_prerequisites()?;
        let mut child = self.spawn_process(&driver_path, port)?;
        self.setup_output_monitoring(&mut child, port);
        self.store_child_process(child);
        self.wait_for_ready(port)
    fn validate_spawn_prerequisites(&self) -> Result<()> {
        let inner = self
            .inner
            .lock()
            .map_err(|e| anyhow!("Failed to acquire lock: {}", e))?;
        // Check if driver path exists
        let driver_path = inner.driver_path.as_ref().ok_or_else(|| {
            error!(
                "WebDriver diagnostics after missing driver path:\n{}",
                self.get_diagnostics()
            anyhow!("No driver path available for spawning")
        })?;
        // Check if binary exists
        if !driver_path.exists() {
            error!(
                "WebDriver diagnostics after missing binary:\n{}",
                self.get_diagnostics()
            return Err(anyhow!("WebDriver binary does not exist: {driver_path:?}"));
        Ok(())
    fn spawn_process(&self, driver_path: &Option<PathBuf>, port: u32) -> Result<Child> {
        let driver_path = driver_path.as_ref().unwrap(); // Safe unwrap since we validated above
        let mut command = Self::create_command(driver_path, port);
        Self::log_command(&command);
        match command.spawn() {
            Ok(child) => Ok(child),
            Err(e) => {
                #[cfg(not(target_os = "windows"))]
                    Err(self.handle_spawn_error(e, &command, "standard method"))
                #[cfg(target_os = "windows")]
                    self.spawn_with_fallback(driver_path, port, e)
    /// Windows-specific fallback spawn method when CREATE_NO_WINDOW fails.
    ///
    /// Retries the spawn with the standard command (no creation flags). Both
    /// the original and the fallback error are logged if the retry fails too.
    ///
    /// # Errors
    /// Returns the error produced by `handle_spawn_error` for the fallback
    /// attempt.
    #[cfg(target_os = "windows")]
    fn spawn_with_fallback(
        &self,
        driver_path: &PathBuf,
        port: u32,
        original_error: std::io::Error,
    ) -> Result<Child> {
        // If CREATE_NO_WINDOW fails, try without any special flags
        error!("Failed to spawn with CREATE_NO_WINDOW: {original_error}");
        error!("Trying without special creation flags...");
        let mut fallback_command = Self::standard_command(driver_path, port);
        Self::log_command(&fallback_command);
        match fallback_command.spawn() {
            Ok(child) => {
                info!("Successfully spawned WebDriver without special creation flags");
                Ok(child)
            }
            Err(fallback_e) => {
                error!("Original error: {original_error}");
                error!("Fallback error: {fallback_e}");
                Err(self.handle_spawn_error(fallback_e, &fallback_command, "fallback method"))
            }
        }
    }
    /// Creates a command with standard configuration (no Windows flags).
    ///
    /// The command runs `driver_path` with `--port=<port>` (plus `--verbose`
    /// when the `chromedriver` feature is enabled) and pipes stdin, stdout and
    /// stderr.
    fn standard_command(driver_path: &PathBuf, port: u32) -> Command {
        let mut command = Command::new(driver_path);
        command.arg(format!("--port={port}"));
        // Add verbose flag only for chromedriver
        #[cfg(feature = "chromedriver")]
        command.arg("--verbose");
        command
            .stdin(Stdio::piped())
            .stdout(Stdio::piped())
            .stderr(Stdio::piped());
        command
    }
    /// Creates a command with Windows-specific flags.
    ///
    /// Starts from the standard command and sets the `CREATE_NO_WINDOW`
    /// process creation flag for headless operation.
    #[cfg(target_os = "windows")]
    fn create_command(driver_path: &PathBuf, port: u32) -> Command {
        use std::os::windows::process::CommandExt;
        /// Win32 process creation flag `CREATE_NO_WINDOW`.
        const CREATE_NO_WINDOW: u32 = 0x0800_0000;
        let mut command = Self::standard_command(driver_path, port);
        // Try with CREATE_NO_WINDOW for headless operation
        command.creation_flags(CREATE_NO_WINDOW);
        command
    }
    #[cfg(not(target_os = "windows"))]
    fn create_command(driver_path: &PathBuf, port: u32) -> Command {
        Self::standard_command(driver_path, port)
    /// Logs command execution details
    fn log_command(command: &Command) {
        info!(
            "Executing command: {:?} {:?}",
            command.get_program(),
            command.get_args()
    /// Handles spawn errors with appropriate logging and diagnostics
    fn handle_spawn_error(
        &self,
        e: std::io::Error,
        command: &Command,
        attempt: &str,
    ) -> anyhow::Error {
        error!("Failed to spawn '{WEBDRIVER_BIN}' with {attempt}: {e}");
        error!(
            "Command was: {:?} {:?}",
            command.get_program(),
            command.get_args()
        #[cfg(target_os = "windows")]
        if attempt == "CREATE_NO_WINDOW" {
            error!("Windows: Check if antivirus is blocking the process");
            error!("Windows: Check if the binary has proper permissions");
        error!(
            "WebDriver diagnostics after spawn failure:\n{}",
            self.get_diagnostics()
        anyhow!("Failed to spawn '{WEBDRIVER_BIN}': {}", e)
    fn setup_output_monitoring(&self, child: &mut Child, port: u32) {
        // Monitor stderr
        if let Some(stderr) = child.stderr.take() {
            let port_for_logging = port;
            thread::spawn(move || {
                info!("Starting stderr monitoring for WebDriver on port {port_for_logging}");
                let stderr_lines = BufReader::new(stderr).lines();
                for line in stderr_lines.map_while(Result::ok) {
                    trace!("WebDriver[{port_for_logging}] stderr: {line}");
                info!("Stderr monitoring ended for WebDriver on port {port_for_logging}");
        // Monitor stdout
        if let Some(stdout) = child.stdout.take() {
            let port_for_logging = port;
            thread::spawn(move || {
                info!("Starting stdout monitoring for WebDriver on port {port_for_logging}");
                let stdout_lines = BufReader::new(stdout).lines();
                for line in stdout_lines.map_while(Result::ok) {
                    trace!("WebDriver[{port_for_logging}] stdout: {line}");
                info!("Stdout monitoring ended for WebDriver on port {port_for_logging}");
    fn store_child_process(&mut self, child: Child) {
        let mut inner = self.inner.lock().unwrap();
        inner.webdriver_child = Some(child);
        info!("WebDriver process stored, waiting for it to become ready...");
    fn wait_for_ready(&self, port: u32) -> Result<()> {
        let start_time = std::time::Instant::now();
        let timeout_duration = if cfg!(target_os = "windows") {
            std::time::Duration::from_secs(60)
        } else {
            std::time::Duration::from_secs(30)
        while start_time.elapsed() < timeout_duration {
            if Self::is_webdriver_running(port) {
                info!(
                    "WebDriver is ready on port {} after {:?}",
                    start_time.elapsed()
                return Ok(());
            // Check if process is still alive
            if let Some(child) = self.inner.lock().unwrap().webdriver_child.as_mut() {
                if let Ok(Some(_)) = child.try_wait() {
                    error!("WebDriver process exited before becoming ready on port {port}");
                    return Err(anyhow!(
                        "WebDriver process exited before becoming ready on port {}",
            std::thread::sleep(std::time::Duration::from_millis(100));
        error!("WebDriver failed to become ready on port {port} within {timeout_duration:?}");
        Err(anyhow!(
            "WebDriver failed to become ready on port {} within {:?}",
            port,
            timeout_duration
    /// Stops the WebDriver process.
    /// This method manages WebDriver process termination:
    /// - Only terminates processes that were spawned by this instance
    /// - Leaves externally managed WebDriver sessions running
    /// - Logs warnings when attempting to stop external sessions
    /// Returns `Ok(())` on success, or an error if the process termination
    /// fails.
    pub fn stop(&mut self) -> Result<()> {
        let mut inner = self
            .inner
            .lock()
            .map_err(|e| anyhow!("Failed to acquire lock: {}", e))?;
        // Only stop the process if we spawned it (not if it's external)
        if !inner.is_external {
            if let Some(child) = inner.webdriver_child.as_mut() {
                info!("Stopping '{WEBDRIVER_BIN}' (PID: {})", child.id());
                let _ = child.kill();
                let _ = child.wait();
        } else {
            warn!(
                "Not stopping external WebDriver on port {} as it was not spawned by us",
                inner.webdriver_port
        Ok(())
    /// Get diagnostic information about the WebDriver process.
    /// This method provides detailed information about the WebDriver process
    /// for debugging purposes.
    /// Returns a string with diagnostic information.
    pub(crate) fn get_diagnostics(&self) -> String {
        let mut inner = self.inner.lock().unwrap();
        let mut diagnostics = String::new();
        diagnostics.push_str("WebDriver Diagnostics:\n");
        diagnostics.push_str(&format!("  Port: {}\n", inner.webdriver_port));
        diagnostics.push_str(&format!("  Driver Path: {:?}\n", inner.driver_path));
        diagnostics.push_str(&format!("  Is External: {}\n", inner.is_external));
        if let Some(child) = inner.webdriver_child.as_mut() {
            diagnostics.push_str(&format!("  Process ID: {}\n", child.id()));
            // Check if process is still running
            match child.try_wait() {
                Ok(None) => diagnostics.push_str("  Process Status: Running\n"),
                Ok(Some(status)) => {
                    diagnostics.push_str(&format!("  Process Status: Exited with {status:?}\n"))
                Err(e) => {
                    diagnostics.push_str(&format!("  Process Status: Error checking status: {e}\n"))
        } else {
            diagnostics.push_str("  Process ID: None (no child process)\n");
        // Check if WebDriver is responding
        let is_running = Self::is_webdriver_running(inner.webdriver_port);
        diagnostics.push_str(&format!("  WebDriver Responding: {is_running}\n"));
        // Check port availability
        let url = format!("{WEBDRIVER_URL}:{}/status", inner.webdriver_port);
        diagnostics.push_str(&format!("  Status URL: {url}\n"));
        #[cfg(target_os = "windows")]
            diagnostics.push_str("  Platform: Windows\n");
            // Check if port is in use using Windows-specific commands
            if let Ok(output) = std::process::Command::new("netstat").args(["-an"]).output() {
                let netstat_output = String::from_utf8_lossy(&output.stdout);
                if netstat_output.contains(&format!(":{}", inner.webdriver_port)) {
                    diagnostics.push_str(&format!(
                        "  Port {} appears to be in use (netstat)\n",
                        inner.webdriver_port
                } else {
                    diagnostics.push_str(&format!(
                        "  Port {} appears to be free (netstat)\n",
                        inner.webdriver_port
            // Check if chromedriver is in PATH (Windows-specific)
            #[cfg(all(target_os = "windows", feature = "chromedriver"))]
                if let Ok(output) = std::process::Command::new("where")
                    .arg("chromedriver")
                    .output()
                    let where_output = String::from_utf8_lossy(&output.stdout);
                    diagnostics
                        .push_str(&format!("  Chromedriver in PATH: {}", where_output.trim()));
                } else {
                    diagnostics.push_str("  Chromedriver not found in PATH\n");
            // Check if geckodriver is in PATH (Windows-specific)
            #[cfg(all(target_os = "windows", feature = "geckodriver"))]
                if let Ok(output) = std::process::Command::new("where")
                    .arg("geckodriver")
                    .output()
                    let where_output = String::from_utf8_lossy(&output.stdout);
                    diagnostics
                        .push_str(&format!("  Geckodriver in PATH: {}", where_output.trim()));
                } else {
                    diagnostics.push_str("  Geckodriver not found in PATH\n");
            // Check Windows Defender status (Windows-specific)
            #[cfg(target_os = "windows")]
                if let Ok(output) = std::process::Command::new("powershell")
                    .args([
                        "-Command",
                        "Get-MpComputerStatus | Select-Object RealTimeProtectionEnabled",
                    .output()
                    let defender_output = String::from_utf8_lossy(&output.stdout);
                    diagnostics.push_str(&format!(
                        "  Windows Defender Real-time Protection: {}",
                        defender_output.trim()
        diagnostics
    /// Check if a WebDriver is already running on the specified port.
    /// This method performs a WebDriver check by:
    /// 1. Making an HTTP GET request to `/status` endpoint
    /// 2. Checking for HTTP 200 response
    /// 3. Verifying the response contains "ready" indicating the service is
    ///    ready
    /// Returns `true` if WebDriver is running and ready, `false` otherwise.
    pub(crate) fn is_webdriver_running(port: u32) -> bool {
        let url = format!("{WEBDRIVER_URL}:{port}/status");
        // Add timeout to prevent hanging
        let client = reqwest::blocking::Client::builder()
            .timeout(std::time::Duration::from_secs(5))
            .build()
            .unwrap_or_else(|_| reqwest::blocking::Client::new());
        client
            .get(&url)
            .send()
            .ok()
            .filter(|response| response.status().as_u16() == 200)
            .and_then(|response| response.text().ok())
            .map(|text| text.contains("ready"))
            .unwrap_or(false)
    fn get_webdriver_path() -> Result<PathBuf> {
        use std::env;
        let path = match env::var(WEBDRIVER_PATH_ENV) {
            Ok(runtime_env) => runtime_env,
            Err(runtime_env_err) => match option_env!("WEBDRIVER_DOWNLOAD_PATH") {
                Some(compile_time_path) => compile_time_path.to_string(),
                None => {
                    debug!("{WEBDRIVER_PATH_ENV}: {runtime_env_err}");
                    warn!("Use the plotly_static's `webdriver_download` feature to automatically download, install and use the the chosen WebDriver for supported platforms. Or manually set {WEBDRIVER_PATH_ENV} to point to the WebDriver binary.");
                    return Err(anyhow!(
                        "WebDriver binary not available. Set {} environment variable or use the webdriver_download feature",
                        WEBDRIVER_PATH_ENV
        Self::full_path(&path).map_err(|e| anyhow!("Invalid WebDriver path '{}': {}", path, e))
    fn full_path(path: &str) -> Result<PathBuf> {
        let p = PathBuf::from(path);
        if !p.exists() {
            Err(anyhow!(
                "WebDriver executable not found at provided path: '{}'",
                p.display()
        } else {
            Ok(p)
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

webdriver.rs

Latest commit

History

webdriver.rs

File metadata and controls