improve interactive history capture

2025-02-25 14:02:43 -05:00 · 2025-02-25 14:02:43 -05:00 · f14863a06d
parent a866b38883
commit f14863a06d
1 changed files with 114 additions and 338 deletions
--- a/ra_aid/proc/interactive.py
+++ b/ra_aid/proc/interactive.py
@ -17,19 +17,14 @@ import shutil
 import signal
 import subprocess
 import sys
 import threading
 import time
-from typing import List, Tuple, Optional, Any
+from typing import List, Tuple
 import pyte
 from pyte.screens import HistoryScreen
-# Import platform-specific modules
+import termios
-if sys.platform == "win32":
+import tty
    import msvcrt
 else:
    import termios
    import tty
 def get_terminal_size() -> Tuple[int, int]:
@ -51,96 +46,8 @@ def get_terminal_size() -> Tuple[int, int]:
        return 80, 24
 def create_process(cmd: List[str]) -> Tuple[subprocess.Popen, Any]:
    """
    Create a subprocess with appropriate platform-specific settings.
    This function handles the platform-specific differences between Windows and Unix:
    On Windows:
    - Creates a process with pipes for stdin/stdout
    - Uses STARTF_USESHOWWINDOW to prevent console windows from appearing
    - Returns the process and None (no PTY on Windows)
    On Unix:
    - Creates a pseudo-terminal (PTY) for full terminal emulation
    - Sets up non-blocking I/O on the master file descriptor
    - Configures environment variables for consistent behavior
    - Creates a new process group for proper signal handling
    Args:
        cmd: A list containing the command and its arguments.
    Returns:
        A tuple of (process, master_fd) where:
        - process is the subprocess.Popen object
        - master_fd is the master file descriptor (on Unix) or None (on Windows)
    """
    if sys.platform == "win32":
        # Windows-specific process creation
        startupinfo = subprocess.STARTUPINFO()
        startupinfo.dwFlags |= subprocess.STARTF_USESHOWWINDOW
        proc = subprocess.Popen(
            cmd,
            stdin=subprocess.PIPE,
            stdout=subprocess.PIPE,
            stderr=subprocess.STDOUT,
            bufsize=0,
            startupinfo=startupinfo
        )
        return proc, None
    else:
        # Unix-specific process creation with pty
        master_fd, slave_fd = os.openpty()
        os.set_blocking(master_fd, False)
        env = os.environ.copy()
        env.update({
            "DEBIAN_FRONTEND": "noninteractive",
            "GIT_PAGER": "",
            "PYTHONUNBUFFERED": "1",
            "CI": "true",
            "LANG": "C.UTF-8",
            "LC_ALL": "C.UTF-8",
            "COLUMNS": str(get_terminal_size()[0]),
            "LINES": str(get_terminal_size()[1]),
            "FORCE_COLOR": "1",
            "GIT_TERMINAL_PROMPT": "0",
            "PYTHONDONTWRITEBYTECODE": "1",
            "NODE_OPTIONS": "--unhandled-rejections=strict",
        })
        proc = subprocess.Popen(
            cmd,
            stdin=slave_fd,
            stdout=slave_fd,
            stderr=slave_fd,
            bufsize=0,
            close_fds=True,
            env=env,
            preexec_fn=os.setsid,  # Create new process group for proper signal handling.
        )
        os.close(slave_fd)  # Close slave end in the parent process.
        return proc, master_fd
 def render_line(line, columns: int) -> str:
-    """
+    """Render a single screen line from the pyte buffer (a mapping of column to Char)."""
    Render a single screen line from the pyte buffer.
    This function handles different types of line representations from pyte:
    - String lines (from screen.display)
    - Dictionary-style lines (from history, mapping column indices to Char objects)
    Args:
        line: A line from pyte's screen buffer (string or dict mapping column to Char)
        columns: Maximum number of columns to render
    Returns:
        A string representation of the line with proper character data
    """
    if not line:
        return ""
@ -150,12 +57,7 @@ def render_line(line, columns: int) -> str:
    # Handle dictionary-style lines (from history)
    try:
-        max_col = max(line.keys()) if line else -1
+        return "".join(line[x].data for x in range(columns) if x in line)
        result = ""
        for x in range(min(columns, max_col + 1)):
            if x in line:
                result += line[x].data
        return result
    except (AttributeError, TypeError):
        # Fallback for any unexpected types
        return str(line)
@ -216,208 +118,127 @@ def run_interactive_command(
    cols, rows = get_terminal_size()
    # Set up pyte screen and stream to capture terminal output.
-    # Increase history size to capture more lines (from 2000 to 5000)
+    screen = HistoryScreen(cols, rows, history=2000, ratio=0.5)
    screen = HistoryScreen(cols, rows, history=5000, ratio=0.8)
    stream = pyte.Stream(screen)
-    # Create process with platform-specific settings
+    # Open a new pseudo-tty.
-    proc, master_fd = create_process(cmd)
+    master_fd, slave_fd = os.openpty()
    # Set master_fd to non-blocking to avoid indefinite blocking.
    os.set_blocking(master_fd, False)
    try:
        stdin_fd = sys.stdin.fileno()
    except (AttributeError, io.UnsupportedOperation):
        stdin_fd = None
    # Set up environment variables for the subprocess using detected terminal size.
    env = os.environ.copy()
    env.update(
        {
            "DEBIAN_FRONTEND": "noninteractive",
            "GIT_PAGER": "",
            "PYTHONUNBUFFERED": "1",
            "CI": "true",
            "LANG": "C.UTF-8",
            "LC_ALL": "C.UTF-8",
            "COLUMNS": str(cols),
            "LINES": str(rows),
            "FORCE_COLOR": "1",
            "GIT_TERMINAL_PROMPT": "0",
            "PYTHONDONTWRITEBYTECODE": "1",
            "NODE_OPTIONS": "--unhandled-rejections=strict",
        }
    )
    proc = subprocess.Popen(
        cmd,
        stdin=slave_fd,
        stdout=slave_fd,
        stderr=slave_fd,
        bufsize=0,
        close_fds=True,
        env=env,
        preexec_fn=os.setsid,  # Create new process group for proper signal handling.
    )
    os.close(slave_fd)  # Close slave end in the parent process.
    captured_data = []
    start_time = time.time()
    was_terminated = False
    def check_timeout():
        """
        Check if the process has exceeded its timeout limits and terminate if necessary.
        Returns:
            True if the process was terminated due to timeout, False otherwise.
        """
        elapsed = time.time() - start_time
-        if sys.platform == "win32":
+        if elapsed > 3 * expected_runtime_seconds:
-            # Windows process termination
+            os.killpg(os.getpgid(proc.pid), signal.SIGKILL)
-            if elapsed > 3 * expected_runtime_seconds:
+            return True
-                # Hard kill after 3x the expected time
+        elif elapsed > 2 * expected_runtime_seconds:
-                proc.kill()
+            os.killpg(os.getpgid(proc.pid), signal.SIGTERM)
-                return True
+            return True
            elif elapsed > 2 * expected_runtime_seconds:
                # Graceful termination after 2x the expected time
                proc.terminate()
                return True
        else:
            # Unix process termination (using process groups)
            if elapsed > 3 * expected_runtime_seconds:
                # Hard kill with SIGKILL after 3x the expected time
                os.killpg(os.getpgid(proc.pid), signal.SIGKILL)
                return True
            elif elapsed > 2 * expected_runtime_seconds:
                # Graceful termination with SIGTERM after 2x the expected time
                os.killpg(os.getpgid(proc.pid), signal.SIGTERM)
                return True
        return False
-    # Windows implementation
+    # Interactive mode: forward input if running in a TTY.
-    if sys.platform == "win32":
+    if stdin_fd is not None and sys.stdin.isatty():
        old_settings = termios.tcgetattr(stdin_fd)
        tty.setraw(stdin_fd)
        try:
-            stdin_fd = None
+            while True:
            if sys.stdin and sys.stdin.isatty():
                try:
                    stdin_fd = sys.stdin.fileno()
                except (AttributeError, io.UnsupportedOperation):
                    stdin_fd = None
            # Function to read output from the process
            def read_output():
                """
                Thread function to continuously read and process output from the subprocess.
                This function:
                1. Reads data from the process stdout in chunks
                2. Adds the data to captured_data for later processing
                3. Feeds the data to the terminal emulator (pyte)
                4. Writes the data to stdout for real-time display
                5. Handles process termination and cleanup
                """
                while proc.poll() is None:
                    try:
                        data = proc.stdout.read(1024)
                        if not data:
                            break
                        captured_data.append(data)
                        decoded = data.decode("utf-8", errors="ignore")
                        stream.feed(decoded)
                        # Write to stdout for real-time display
                        try:
                            sys.stdout.buffer.write(data)
                            sys.stdout.buffer.flush()
                        except (OSError, IOError):
                            pass  # Ignore errors writing to stdout
                    except (OSError, IOError):
                        break
                    except Exception as e:
                        print(f"Error reading output: {e}", file=sys.stderr)
                        break
                # Try to read any remaining data after process ends
                try:
                    remaining = proc.stdout.read()
                    if remaining:
                        captured_data.append(remaining)
                        stream.feed(remaining.decode("utf-8", errors="ignore"))
                except Exception:
                    pass
            # Start a thread to read output
            output_thread = threading.Thread(target=read_output)
            output_thread.daemon = True
            output_thread.start()
            # Main loop for input and timeout checking
            while proc.poll() is None:
                if check_timeout():
                    was_terminated = True
                    break
-
+                # Use a finite timeout to avoid indefinite blocking.
-                # Check for input if we have a TTY
+                rlist, _, _ = select.select([master_fd, stdin_fd], [], [], 1.0)
-                if stdin_fd is not None and msvcrt.kbhit():
+                if master_fd in rlist:
                    try:
-                        char = msvcrt.getch()
+                        data = os.read(master_fd, 1024)
-                        proc.stdin.write(char)
+                    except OSError as e:
-                        proc.stdin.flush()
+                        if e.errno == errno.EIO:
-                    except (OSError, IOError):
+                            break
                        else:
                            raise
                    if not data:  # EOF detected.
                        break
-
+                    captured_data.append(data)
-                time.sleep(0.1)  # Small sleep to prevent CPU hogging
+                    decoded = data.decode("utf-8", errors="ignore")
-
+                    stream.feed(decoded)
-            # Wait for the output thread to finish
+                    os.write(1, data)
-            output_thread.join(timeout=1.0)
+                if stdin_fd in rlist:
-
+                    try:
                        input_data = os.read(stdin_fd, 1024)
                    except OSError:
                        input_data = b""
                    if input_data:
                        os.write(master_fd, input_data)
        except KeyboardInterrupt:
            proc.terminate()
        finally:
-            if proc.stdin:
+            termios.tcsetattr(stdin_fd, termios.TCSADRAIN, old_settings)
                proc.stdin.close()
            if proc.stdout:
                proc.stdout.close()
    # Unix implementation
    else:
        # Non-interactive mode.
        try:
-            stdin_fd = None
+            while True:
-            try:
+                if check_timeout():
-                stdin_fd = sys.stdin.fileno()
+                    was_terminated = True
-            except (AttributeError, io.UnsupportedOperation):
+                    break
-                stdin_fd = None
+                rlist, _, _ = select.select([master_fd], [], [], 1.0)
-
+                if not rlist:
-            # Interactive mode: forward input if running in a TTY.
+                    continue
            if stdin_fd is not None and sys.stdin.isatty():
                old_settings = termios.tcgetattr(stdin_fd)
                tty.setraw(stdin_fd)
                try:
-                    while True:
+                    data = os.read(master_fd, 1024)
-                        if check_timeout():
+                except OSError as e:
-                            was_terminated = True
+                    if e.errno == errno.EIO:
-                            break
+                        break
-                        # Use a finite timeout to avoid indefinite blocking.
+                    else:
-                        rlist, _, _ = select.select([master_fd, stdin_fd], [], [], 1.0)
+                        raise
-                        if master_fd in rlist:
+                if not data:  # EOF detected.
-                            try:
+                    break
-                                data = os.read(master_fd, 1024)
+                captured_data.append(data)
-                            except OSError as e:
+                decoded = data.decode("utf-8", errors="ignore")
-                                if e.errno == errno.EIO:
+                stream.feed(decoded)
-                                    break
+                os.write(1, data)
-                                else:
+        except KeyboardInterrupt:
-                                    raise
+            proc.terminate()
                            if not data:  # EOF detected.
                                break
                            captured_data.append(data)
                            decoded = data.decode("utf-8", errors="ignore")
                            stream.feed(decoded)
                            os.write(1, data)
                        if stdin_fd in rlist:
                            try:
                                input_data = os.read(stdin_fd, 1024)
                            except OSError:
                                input_data = b""
                            if input_data:
                                os.write(master_fd, input_data)
                except KeyboardInterrupt:
                    proc.terminate()
                finally:
                    termios.tcsetattr(stdin_fd, termios.TCSADRAIN, old_settings)
            else:
                # Non-interactive mode.
                try:
                    while True:
                        if check_timeout():
                            was_terminated = True
                            break
                        rlist, _, _ = select.select([master_fd], [], [], 1.0)
                        if not rlist:
                            continue
                        try:
                            data = os.read(master_fd, 1024)
                        except OSError as e:
                            if e.errno == errno.EIO:
                                break
                            else:
                                raise
                        if not data:  # EOF detected.
                            break
                        captured_data.append(data)
                        decoded = data.decode("utf-8", errors="ignore")
                        stream.feed(decoded)
                        try:
                            os.write(1, data)
                        except (OSError, IOError):
                            pass  # Ignore errors writing to stdout
                except KeyboardInterrupt:
                    proc.terminate()
-            os.close(master_fd)
+    os.close(master_fd)
        except Exception as e:
            print(f"Error in Unix implementation: {e}", file=sys.stderr)
    # Wait for the process to finish
    proc.wait()
@ -425,44 +246,20 @@ def run_interactive_command(
    # Ensure we have captured data even if the screen processing failed
    raw_output = b"".join(captured_data)
-    # Try to assemble full scrollback from the terminal emulation
+    # Assemble full scrollback from the terminal emulation
    try:
        # Assemble full scrollback: combine history.top, the current display, and history.bottom.
-        top_lines = []
+        top_lines = [render_line(line, cols) for line in screen.history.top]
-        display_lines = []
+        display_lines = [render_line(line, cols) for line in screen.display]
-        bottom_lines = []
+        bottom_lines = [render_line(line, cols) for line in screen.history.bottom]
        # Safely extract history.top (scrollback buffer above visible area)
        if hasattr(screen, 'history') and hasattr(screen.history, 'top'):
            top_lines = [render_line(line, cols) for line in screen.history.top]
        # Safely extract current display (visible terminal area)
        if hasattr(screen, 'display'):
            display_lines = [render_line(line, cols) for line in screen.display]
        # Safely extract history.bottom (scrollback buffer below visible area)
        if hasattr(screen, 'history') and hasattr(screen.history, 'bottom'):
            bottom_lines = [render_line(line, cols) for line in screen.history.bottom]
        # Combine all lines to get the complete terminal history
        all_lines = top_lines + display_lines + bottom_lines
        # Trim out empty lines to get only meaningful "history" lines
        # This is important for commands that don't fill the entire terminal
        trimmed_lines = [line for line in all_lines if line and line.strip()]
-        # IMPORTANT: Always check if we have meaningful content from the screen
+        final_output = "\n".join(trimmed_lines)
        if trimmed_lines and any(line.strip() for line in trimmed_lines):
            final_output = "\n".join(trimmed_lines)
        else:
            # Fall back to raw output if no meaningful lines from screen
            # This is critical for simple commands like "echo hello world"
            raw_decoded = raw_output.decode('utf-8', errors='replace')
            final_output = raw_decoded.strip()
            # If raw output is also empty, try to extract any content from the screen
            if not final_output and display_lines:
                final_output = "\n".join(display_lines)
    except Exception as e:
        # If anything goes wrong with screen processing, fall back to raw output
        print(f"Warning: Error processing terminal output: {e}", file=sys.stderr)
@ -473,36 +270,15 @@ def run_interactive_command(
        timeout_msg = f"\n[Process exceeded timeout ({expected_runtime_seconds} seconds expected)]"
        final_output += timeout_msg
-    # Limit output to the last 8000 bytes, but try to keep complete lines
+    # Limit output to the last 8000 bytes
    # This ensures we don't exceed memory limits while preserving readable output
    if len(final_output) > 8000:
        # Find a newline near the 8000-byte cutoff point
        cutoff = max(0, len(final_output) - 8000)
        # Try to find a newline after the cutoff to avoid cutting in the middle of a line
        newline_pos = final_output.find('\n', cutoff)
        if newline_pos != -1 and newline_pos < cutoff + 200:  # Don't look too far ahead
            cutoff = newline_pos + 1
        final_output = final_output[cutoff:]
    # Ensure we're returning bytes with consistent encoding
    if isinstance(final_output, str):
-        # Make sure we have content in the final output
+        final_output = final_output[-8000:]
        if not final_output.strip() and raw_output:
            # Fall back to raw output if processed output is empty
            final_output = raw_output.decode('utf-8', errors='replace').strip()
        final_output = final_output.encode("utf-8")
-    elif not isinstance(final_output, bytes):
+    elif isinstance(final_output, bytes):
-        # Handle any unexpected type by converting to string and then bytes
+        final_output = final_output[-8000:]
-        final_output = str(final_output).encode("utf-8")
+    else:
-        
+        # Handle any unexpected type
-    # Ensure we have at least some output, even if the command produced none
+        final_output = str(final_output)[-8000:].encode("utf-8")
    # This is important for error reporting and debugging
    if not final_output or final_output.strip() == b"":
        # Last resort: use raw output directly
        if raw_output:
            final_output = raw_output
        else:
            final_output = b"[No output captured]"
    return final_output, proc.returncode