RA.Aid/ra_aid/proc/interactive.py

#!/usr/bin/env python3
"""
Module for running interactive subprocesses with output capture,
with full raw input passthrough for interactive commands.

It uses a pseudo-tty and integrates pyte's HistoryScreen to simulate
a terminal and capture the final scrollback history (non-blank lines).
The interface remains compatible with external callers expecting a tuple (output, return_code),
where output is a bytes object (UTF-8 encoded).
"""

import errno
import io
import os
import select
import shutil
import signal
import subprocess
import sys
import threading
import time
from typing import List, Tuple, Optional, Any

import pyte
from pyte.screens import HistoryScreen

# Import platform-specific modules
if sys.platform == "win32":
    import msvcrt
else:
    import termios
    import tty


def get_terminal_size() -> Tuple[int, int]:
    """
    Get the current terminal size in a cross-platform way.

    This function works on both Unix and Windows systems, using shutil.get_terminal_size()
    which is available in Python 3.3+. If the terminal size cannot be determined
    (e.g., when running in a non-interactive environment), it falls back to default values.

    Returns:
        A tuple of (columns, rows) representing the terminal dimensions.
    """
    try:
        size = shutil.get_terminal_size()
        return size.columns, size.lines
    except OSError:
        # Default fallback values
        return 80, 24


def create_process(cmd: List[str]) -> Tuple[subprocess.Popen, Any]:
    """
    Create a subprocess with appropriate platform-specific settings.

    This function handles the platform-specific differences between Windows and Unix:

    On Windows:
    - Creates a process with pipes for stdin/stdout
    - Uses STARTF_USESHOWWINDOW to prevent console windows from appearing
    - Returns the process and None (no PTY on Windows)

    On Unix:
    - Creates a pseudo-terminal (PTY) for full terminal emulation
    - Sets up non-blocking I/O on the master file descriptor
    - Configures environment variables for consistent behavior
    - Creates a new process group for proper signal handling

    Args:
        cmd: A list containing the command and its arguments.

    Returns:
        A tuple of (process, master_fd) where:
        - process is the subprocess.Popen object
        - master_fd is the master file descriptor (on Unix) or None (on Windows)
    """
    if sys.platform == "win32":
        # Windows-specific process creation
        startupinfo = subprocess.STARTUPINFO()
        startupinfo.dwFlags |= subprocess.STARTF_USESHOWWINDOW

        proc = subprocess.Popen(
            cmd,
            stdin=subprocess.PIPE,
            stdout=subprocess.PIPE,
            stderr=subprocess.STDOUT,
            bufsize=0,
            startupinfo=startupinfo
        )
        return proc, None
    else:
        # Unix-specific process creation with pty
        master_fd, slave_fd = os.openpty()
        os.set_blocking(master_fd, False)

        env = os.environ.copy()
        env.update({
            "DEBIAN_FRONTEND": "noninteractive",
            "GIT_PAGER": "",
            "PYTHONUNBUFFERED": "1",
            "CI": "true",
            "LANG": "C.UTF-8",
            "LC_ALL": "C.UTF-8",
            "COLUMNS": str(get_terminal_size()[0]),
            "LINES": str(get_terminal_size()[1]),
            "FORCE_COLOR": "1",
            "GIT_TERMINAL_PROMPT": "0",
            "PYTHONDONTWRITEBYTECODE": "1",
            "NODE_OPTIONS": "--unhandled-rejections=strict",
        })

        proc = subprocess.Popen(
            cmd,
            stdin=slave_fd,
            stdout=slave_fd,
            stderr=slave_fd,
            bufsize=0,
            close_fds=True,
            env=env,
            preexec_fn=os.setsid,  # Create new process group for proper signal handling.
        )
        os.close(slave_fd)  # Close slave end in the parent process.

        return proc, master_fd


def render_line(line, columns: int) -> str:
    """
    Render a single screen line from the pyte buffer.

    This function handles different types of line representations from pyte:
    - String lines (from screen.display)
    - Dictionary-style lines (from history, mapping column indices to Char objects)

    Args:
        line: A line from pyte's screen buffer (string or dict mapping column to Char)
        columns: Maximum number of columns to render

    Returns:
        A string representation of the line with proper character data
    """
    if not line:
        return ""

    # Handle string lines directly (from screen.display)
    if isinstance(line, str):
        return line

    # Handle dictionary-style lines (from history)
    try:
        max_col = max(line.keys()) if line else -1
        result = ""
        for x in range(min(columns, max_col + 1)):
            if x in line:
                result += line[x].data
        return result
    except (AttributeError, TypeError):
        # Fallback for any unexpected types
        return str(line)


def run_interactive_command(
    cmd: List[str], expected_runtime_seconds: int = 30
) -> Tuple[bytes, int]:
    """
    Runs an interactive command with output capture, capturing final scrollback history.

    This function provides a cross-platform way to run interactive commands with:
    - Full terminal emulation using pyte's HistoryScreen
    - Real-time display of command output
    - Input forwarding when running in an interactive terminal
    - Timeout handling to prevent runaway processes
    - Comprehensive output capture including ANSI escape sequences

    The implementation differs significantly between Windows and Unix:

    On Windows:
    - Uses threading to handle I/O operations
    - Relies on msvcrt for keyboard input detection
    - Uses pipes for process communication

    On Unix:
    - Uses pseudo-terminals (PTY) for full terminal emulation
    - Uses select() for non-blocking I/O
    - Handles raw terminal mode for proper input forwarding
    - Uses process groups for proper signal handling

    Args:
      cmd: A list containing the command and its arguments.
      expected_runtime_seconds: Expected runtime in seconds, defaults to 30.
        If process exceeds 2x this value, it will be terminated gracefully.
        If process exceeds 3x this value, it will be killed forcefully.
        Must be between 1 and 1800 seconds (30 minutes).

    Returns:
      A tuple of (captured_output, return_code), where captured_output is a UTF-8 encoded
      bytes object containing the trimmed non-empty history lines from the terminal session.

    Raises:
      ValueError: If no command is provided.
      FileNotFoundError: If the command is not found in PATH.
      ValueError: If expected_runtime_seconds is less than or equal to 0 or greater than 1800.
      RuntimeError: If an error occurs during execution.
    """
    if not cmd:
        raise ValueError("No command provided.")
    if shutil.which(cmd[0]) is None:
        raise FileNotFoundError(f"Command '{cmd[0]}' not found in PATH.")
    if expected_runtime_seconds <= 0 or expected_runtime_seconds > 1800:
        raise ValueError(
            "expected_runtime_seconds must be between 1 and 1800 seconds (30 minutes)"
        )

    cols, rows = get_terminal_size()

    # Set up pyte screen and stream to capture terminal output.
    # Increase history size to capture more lines (from 2000 to 5000)
    screen = HistoryScreen(cols, rows, history=5000, ratio=0.8)
    stream = pyte.Stream(screen)

    # Create process with platform-specific settings
    proc, master_fd = create_process(cmd)

    captured_data = []
    start_time = time.time()
    was_terminated = False

    def check_timeout():
        """
        Check if the process has exceeded its timeout limits and terminate if necessary.

        Returns:
            True if the process was terminated due to timeout, False otherwise.
        """
        elapsed = time.time() - start_time
        if sys.platform == "win32":
            # Windows process termination
            if elapsed > 3 * expected_runtime_seconds:
                # Hard kill after 3x the expected time
                proc.kill()
                return True
            elif elapsed > 2 * expected_runtime_seconds:
                # Graceful termination after 2x the expected time
                proc.terminate()
                return True
        else:
            # Unix process termination (using process groups)
            if elapsed > 3 * expected_runtime_seconds:
                # Hard kill with SIGKILL after 3x the expected time
                os.killpg(os.getpgid(proc.pid), signal.SIGKILL)
                return True
            elif elapsed > 2 * expected_runtime_seconds:
                # Graceful termination with SIGTERM after 2x the expected time
                os.killpg(os.getpgid(proc.pid), signal.SIGTERM)
                return True
        return False

    # Windows implementation
    if sys.platform == "win32":
        try:
            stdin_fd = None
            if sys.stdin and sys.stdin.isatty():
                try:
                    stdin_fd = sys.stdin.fileno()
                except (AttributeError, io.UnsupportedOperation):
                    stdin_fd = None

            # Function to read output from the process
            def read_output():
                """
                Thread function to continuously read and process output from the subprocess.

                This function:
                1. Reads data from the process stdout in chunks
                2. Adds the data to captured_data for later processing
                3. Feeds the data to the terminal emulator (pyte)
                4. Writes the data to stdout for real-time display
                5. Handles process termination and cleanup
                """
                while proc.poll() is None:
                    try:
                        data = proc.stdout.read(1024)
                        if not data:
                            break
                        captured_data.append(data)
                        decoded = data.decode("utf-8", errors="ignore")
                        stream.feed(decoded)
                        # Write to stdout for real-time display
                        try:
                            sys.stdout.buffer.write(data)
                            sys.stdout.buffer.flush()
                        except (OSError, IOError):
                            pass  # Ignore errors writing to stdout
                    except (OSError, IOError):
                        break
                    except Exception as e:
                        print(f"Error reading output: {e}", file=sys.stderr)
                        break

                # Try to read any remaining data after process ends
                try:
                    remaining = proc.stdout.read()
                    if remaining:
                        captured_data.append(remaining)
                        stream.feed(remaining.decode("utf-8", errors="ignore"))
                except Exception:
                    pass

            # Start a thread to read output
            output_thread = threading.Thread(target=read_output)
            output_thread.daemon = True
            output_thread.start()

            # Main loop for input and timeout checking
            while proc.poll() is None:
                if check_timeout():
                    was_terminated = True
                    break

                # Check for input if we have a TTY
                if stdin_fd is not None and msvcrt.kbhit():
                    try:
                        char = msvcrt.getch()
                        proc.stdin.write(char)
                        proc.stdin.flush()
                    except (OSError, IOError):
                        break

                time.sleep(0.1)  # Small sleep to prevent CPU hogging

            # Wait for the output thread to finish
            output_thread.join(timeout=1.0)

        except KeyboardInterrupt:
            proc.terminate()
        finally:
            if proc.stdin:
                proc.stdin.close()
            if proc.stdout:
                proc.stdout.close()

    # Unix implementation
    else:
        try:
            stdin_fd = None
            try:
                stdin_fd = sys.stdin.fileno()
            except (AttributeError, io.UnsupportedOperation):
                stdin_fd = None

            # Interactive mode: forward input if running in a TTY.
            if stdin_fd is not None and sys.stdin.isatty():
                old_settings = termios.tcgetattr(stdin_fd)
                tty.setraw(stdin_fd)
                try:
                    while True:
                        if check_timeout():
                            was_terminated = True
                            break
                        # Use a finite timeout to avoid indefinite blocking.
                        rlist, _, _ = select.select([master_fd, stdin_fd], [], [], 1.0)
                        if master_fd in rlist:
                            try:
                                data = os.read(master_fd, 1024)
                            except OSError as e:
                                if e.errno == errno.EIO:
                                    break
                                else:
                                    raise
                            if not data:  # EOF detected.
                                break
                            captured_data.append(data)
                            decoded = data.decode("utf-8", errors="ignore")
                            stream.feed(decoded)
                            os.write(1, data)
                        if stdin_fd in rlist:
                            try:
                                input_data = os.read(stdin_fd, 1024)
                            except OSError:
                                input_data = b""
                            if input_data:
                                os.write(master_fd, input_data)
                except KeyboardInterrupt:
                    proc.terminate()
                finally:
                    termios.tcsetattr(stdin_fd, termios.TCSADRAIN, old_settings)
            else:
                # Non-interactive mode.
                try:
                    while True:
                        if check_timeout():
                            was_terminated = True
                            break
                        rlist, _, _ = select.select([master_fd], [], [], 1.0)
                        if not rlist:
                            continue
                        try:
                            data = os.read(master_fd, 1024)
                        except OSError as e:
                            if e.errno == errno.EIO:
                                break
                            else:
                                raise
                        if not data:  # EOF detected.
                            break
                        captured_data.append(data)
                        decoded = data.decode("utf-8", errors="ignore")
                        stream.feed(decoded)
                        try:
                            os.write(1, data)
                        except (OSError, IOError):
                            pass  # Ignore errors writing to stdout
                except KeyboardInterrupt:
                    proc.terminate()

            os.close(master_fd)
        except Exception as e:
            print(f"Error in Unix implementation: {e}", file=sys.stderr)

    # Wait for the process to finish
    proc.wait()

    # Ensure we have captured data even if the screen processing failed
    raw_output = b"".join(captured_data)

    # Try to assemble full scrollback from the terminal emulation
    try:
        # Assemble full scrollback: combine history.top, the current display, and history.bottom.
        top_lines = []
        display_lines = []
        bottom_lines = []

        # Safely extract history.top (scrollback buffer above visible area)
        if hasattr(screen, 'history') and hasattr(screen.history, 'top'):
            top_lines = [render_line(line, cols) for line in screen.history.top]

        # Safely extract current display (visible terminal area)
        if hasattr(screen, 'display'):
            display_lines = [render_line(line, cols) for line in screen.display]

        # Safely extract history.bottom (scrollback buffer below visible area)
        if hasattr(screen, 'history') and hasattr(screen.history, 'bottom'):
            bottom_lines = [render_line(line, cols) for line in screen.history.bottom]

        # Combine all lines to get the complete terminal history
        all_lines = top_lines + display_lines + bottom_lines

        # Trim out empty lines to get only meaningful "history" lines
        # This is important for commands that don't fill the entire terminal
        trimmed_lines = [line for line in all_lines if line and line.strip()]

        # IMPORTANT: Always check if we have meaningful content from the screen
        if trimmed_lines and any(line.strip() for line in trimmed_lines):
            final_output = "\n".join(trimmed_lines)
        else:
            # Fall back to raw output if no meaningful lines from screen
            # This is critical for simple commands like "echo hello world"
            raw_decoded = raw_output.decode('utf-8', errors='replace')
            final_output = raw_decoded.strip()

            # If raw output is also empty, try to extract any content from the screen
            if not final_output and display_lines:
                final_output = "\n".join(display_lines)
    except Exception as e:
        # If anything goes wrong with screen processing, fall back to raw output
        print(f"Warning: Error processing terminal output: {e}", file=sys.stderr)
        final_output = raw_output.decode('utf-8', errors='replace').strip()

    # Add timeout message if process was terminated due to timeout.
    if was_terminated:
        timeout_msg = f"\n[Process exceeded timeout ({expected_runtime_seconds} seconds expected)]"
        final_output += timeout_msg

    # Limit output to the last 8000 bytes, but try to keep complete lines
    # This ensures we don't exceed memory limits while preserving readable output
    if len(final_output) > 8000:
        # Find a newline near the 8000-byte cutoff point
        cutoff = max(0, len(final_output) - 8000)
        # Try to find a newline after the cutoff to avoid cutting in the middle of a line
        newline_pos = final_output.find('\n', cutoff)
        if newline_pos != -1 and newline_pos < cutoff + 200:  # Don't look too far ahead
            cutoff = newline_pos + 1
        final_output = final_output[cutoff:]

    # Ensure we're returning bytes with consistent encoding
    if isinstance(final_output, str):
        # Make sure we have content in the final output
        if not final_output.strip() and raw_output:
            # Fall back to raw output if processed output is empty
            final_output = raw_output.decode('utf-8', errors='replace').strip()
        final_output = final_output.encode("utf-8")
    elif not isinstance(final_output, bytes):
        # Handle any unexpected type by converting to string and then bytes
        final_output = str(final_output).encode("utf-8")

    # Ensure we have at least some output, even if the command produced none
    # This is important for error reporting and debugging
    if not final_output or final_output.strip() == b"":
        # Last resort: use raw output directly
        if raw_output:
            final_output = raw_output
        else:
            final_output = b"[No output captured]"

    return final_output, proc.returncode


if __name__ == "__main__":
    import sys

    if len(sys.argv) < 2:
        print("Usage: interactive.py <command> [args...]")
        sys.exit(1)
    output, return_code = run_interactive_command(sys.argv[1:])
    sys.exit(return_code)