RA.Aid/ra_aid/tools/read_file.py

72 lines
2.0 KiB
Python

import logging
import os.path
import time
from typing import Dict
from langchain_core.tools import tool
from rich.console import Console
from rich.panel import Panel
from ra_aid.text.processing import truncate_output
# Shared rich console; read_file_tool prints its "File Read" status panel to it.
console = Console()
# Size argument passed to f.read() in read_file_tool. The file is opened in
# text mode there, so this is the maximum number of decoded characters
# requested per read call, not a raw byte count.
CHUNK_SIZE = 8192
@tool
def read_file_tool(filepath: str, encoding: str = "utf-8") -> Dict[str, str]:
    """Read and return the contents of a text file.

    Args:
        filepath: Path to the file to read
        encoding: File encoding to use (default: utf-8)
    """
    # NOTE(review): the @tool decorator presumably exposes the docstring above
    # as the tool description, so its wording is left unchanged -- confirm
    # before editing it. Further contract details are kept in comments:
    #
    # Returns: {"content": text}, where text is the whole file passed through
    #   truncate_output(), or "" when the file is empty.
    # Raises: FileNotFoundError when filepath does not exist. Any error raised
    #   by open()/read() (permissions, decoding, ...) propagates unchanged.
    start_time = time.time()

    if not os.path.exists(filepath):
        raise FileNotFoundError(f"File not found: {filepath}")

    # Debug messages use lazy %-style arguments so that no string formatting
    # happens (notably once per chunk) unless DEBUG logging is enabled.
    logging.debug("Starting to read file: %s", filepath)

    content = []
    line_count = 0
    # The file is read in text mode, so len(chunk) counts decoded characters.
    # The figure reported as "bytes" therefore only equals the on-disk size
    # for single-byte content without newline translation.
    total_bytes = 0

    with open(filepath, "r", encoding=encoding) as f:
        while True:
            chunk = f.read(CHUNK_SIZE)
            if not chunk:
                # An empty string signals end of file.
                break
            content.append(chunk)
            total_bytes += len(chunk)
            line_count += chunk.count("\n")
            logging.debug(
                "Read chunk: %d bytes, running total: %d bytes",
                len(chunk),
                total_bytes,
            )

    full_content = "".join(content)
    elapsed = time.time() - start_time

    logging.debug("File read complete: %d bytes in %.2fs", total_bytes, elapsed)
    logging.debug(
        "Pre-truncation stats: %d bytes, %d lines", total_bytes, line_count
    )

    console.print(
        Panel(
            f"Read {line_count} lines ({total_bytes} bytes) from {filepath} in {elapsed:.2f}s",
            title="📄 File Read",
            border_style="bright_blue",
        )
    )

    # Truncate if needed
    truncated = truncate_output(full_content) if full_content else ""
    return {"content": truncated}