tool/str_replace_editor.py · Speedofmastery/yyuu at main

yyuu / tool /str_replace_editor.py

Upload folder using huggingface_hub

262f6b3 verified 4 months ago

17.1 kB

	"""File and directory manipulation tool with sandbox support."""

	from collections import defaultdict
	from pathlib import Path
	from typing import Any, DefaultDict, List, Literal, Optional, get_args

	from app.config import config
	from app.exceptions import ToolError
	from app.tool import BaseTool
	from app.tool.base import CLIResult, ToolResult
	from app.tool.file_operators import (
	FileOperator,
	LocalFileOperator,
	PathLike,
	SandboxFileOperator,
	)


	# Closed set of sub-commands accepted by the editor tool. `get_args(Command)`
	# is used to list the allowed values in the "Unrecognized command" error.
	Command = Literal[
	"view",
	"create",
	"str_replace",
	"insert",
	"undo_edit",
	]

	# Constants
	# Number of context lines shown before and after an edit in result snippets.
	SNIPPET_LINES: int = 4
	# Default character limit used by `maybe_truncate` before content is clipped.
	MAX_RESPONSE_LEN: int = 16000
	# Notice appended by `maybe_truncate` to content that was cut at the limit.
	TRUNCATED_MESSAGE: str = (
	"<response clipped><NOTE>To save on context only part of this file has been shown to you. "
	"You should retry this tool after you have searched inside the file with `grep -n` "
	"in order to find the line numbers of what you are looking for.</NOTE>"
	)

	# Tool description
	# Usage text exposed as `StrReplaceEditor.description`. It is a runtime string:
	# edit its wording deliberately, never for formatting reasons.
	_STR_REPLACE_EDITOR_DESCRIPTION = """Custom editing tool for viewing, creating and editing files
	* State is persistent across command calls and discussions with the user
	* If `path` is a file, `view` displays the result of applying `cat -n`. If `path` is a directory, `view` lists non-hidden files and directories up to 2 levels deep
	* The `create` command cannot be used if the specified `path` already exists as a file
	* If a `command` generates a long output, it will be truncated and marked with `<response clipped>`
	* The `undo_edit` command will revert the last edit made to the file at `path`

	Notes for using the `str_replace` command:
	* The `old_str` parameter should match EXACTLY one or more consecutive lines from the original file. Be mindful of whitespaces!
	* If the `old_str` parameter is not unique in the file, the replacement will not be performed. Make sure to include enough context in `old_str` to make it unique
	* The `new_str` parameter should contain the edited lines that should replace the `old_str`
	"""


	def maybe_truncate(
	    content: str, truncate_after: Optional[int] = MAX_RESPONSE_LEN
	) -> str:
	    """Clip `content` to `truncate_after` characters and flag the cut.

	    Args:
	        content: Text to return, possibly shortened.
	        truncate_after: Character limit. A falsy value (`None` or `0`)
	            disables truncation.

	    Returns:
	        `content` unchanged when no limit applies or it fits within the
	        limit; otherwise its first `truncate_after` characters followed by
	        `TRUNCATED_MESSAGE`.
	    """
	    limit_enabled = bool(truncate_after)
	    if limit_enabled and len(content) > truncate_after:
	        clipped = content[:truncate_after]
	        return clipped + TRUNCATED_MESSAGE
	    return content


	class StrReplaceEditor(BaseTool):
	    """A tool for viewing, creating, and editing files with sandbox support.

	    `execute` validates the path/command combination and dispatches to the
	    command-specific coroutine. All file access goes through a `FileOperator`
	    chosen by `_get_operator` (sandbox or local, depending on
	    `config.sandbox.use_sandbox`).
	    """

	    name: str = "str_replace_editor"
	    description: str = _STR_REPLACE_EDITOR_DESCRIPTION
	    parameters: dict = {
	        "type": "object",
	        "properties": {
	            "command": {
	                "description": "The commands to run. Allowed options are: `view`, `create`, `str_replace`, `insert`, `undo_edit`.",
	                "enum": ["view", "create", "str_replace", "insert", "undo_edit"],
	                "type": "string",
	            },
	            "path": {
	                "description": "Absolute path to file or directory.",
	                "type": "string",
	            },
	            "file_text": {
	                "description": "Required parameter of `create` command, with the content of the file to be created.",
	                "type": "string",
	            },
	            "old_str": {
	                "description": "Required parameter of `str_replace` command containing the string in `path` to replace.",
	                "type": "string",
	            },
	            "new_str": {
	                "description": "Optional parameter of `str_replace` command containing the new string (if not given, no string will be added). Required parameter of `insert` command containing the string to insert.",
	                "type": "string",
	            },
	            "insert_line": {
	                "description": "Required parameter of `insert` command. The `new_str` will be inserted AFTER the line `insert_line` of `path`.",
	                "type": "integer",
	            },
	            "view_range": {
	                "description": "Optional parameter of `view` command when `path` points to a file. If none is given, the full file is shown. If provided, the file will be shown in the indicated line number range, e.g. [11, 12] will show lines 11 and 12. Indexing at 1 to start. Setting `[start_line, -1]` shows all lines from `start_line` to the end of the file.",
	                "items": {"type": "integer"},
	                "type": "array",
	            },
	        },
	        "required": ["command", "path"],
	    }
	    # Undo stack per path. `str_replace` and `insert` push the content the file
	    # had before the edit; `create` pushes the text it just wrote.
	    _file_history: DefaultDict[PathLike, List[str]] = defaultdict(list)
	    _local_operator: LocalFileOperator = LocalFileOperator()
	    _sandbox_operator: SandboxFileOperator = SandboxFileOperator()

	    def _get_operator(self) -> FileOperator:
	        """Return the sandbox operator when sandboxing is enabled, else the local one."""
	        return (
	            self._sandbox_operator
	            if config.sandbox.use_sandbox
	            else self._local_operator
	        )

	    async def execute(
	        self,
	        *,
	        command: Command,
	        path: str,
	        file_text: Optional[str] = None,
	        view_range: Optional[List[int]] = None,
	        old_str: Optional[str] = None,
	        new_str: Optional[str] = None,
	        insert_line: Optional[int] = None,
	        **kwargs: Any,
	    ) -> str:
	        """Execute a file operation command.

	        Args:
	            command: One of the values of `Command`.
	            path: Absolute path of the file or directory to operate on.
	            file_text: Content for `create` (required by that command).
	            view_range: Optional `[start, end]` line range for `view`.
	            old_str: Text to replace for `str_replace` (required by it).
	            new_str: Replacement text for `str_replace`, or the text to
	                insert for `insert` (required by `insert`).
	            insert_line: Line after which `insert` adds `new_str`
	                (required by `insert`).
	            **kwargs: Accepted and ignored.

	        Returns:
	            The string form of the command's result object.

	        Raises:
	            ToolError: If the path/command combination is invalid, a required
	                parameter is missing, or the command is not recognized.
	        """
	        # Get the appropriate file operator
	        operator = self._get_operator()

	        # Validate path and command combination
	        await self.validate_path(command, Path(path), operator)

	        # Execute the appropriate command
	        if command == "view":
	            result = await self.view(path, view_range, operator)
	        elif command == "create":
	            if file_text is None:
	                raise ToolError("Parameter `file_text` is required for command: create")
	            await operator.write_file(path, file_text)
	            self._file_history[path].append(file_text)
	            result = ToolResult(output=f"File created successfully at: {path}")
	        elif command == "str_replace":
	            if old_str is None:
	                raise ToolError(
	                    "Parameter `old_str` is required for command: str_replace"
	                )
	            result = await self.str_replace(path, old_str, new_str, operator)
	        elif command == "insert":
	            if insert_line is None:
	                raise ToolError(
	                    "Parameter `insert_line` is required for command: insert"
	                )
	            if new_str is None:
	                raise ToolError("Parameter `new_str` is required for command: insert")
	            result = await self.insert(path, insert_line, new_str, operator)
	        elif command == "undo_edit":
	            result = await self.undo_edit(path, operator)
	        else:
	            # This should be caught by type checking, but we include it for safety
	            raise ToolError(
	                f'Unrecognized command {command}. The allowed commands for the {self.name} tool are: {", ".join(get_args(Command))}'
	            )

	        return str(result)

	    async def validate_path(
	        self, command: str, path: Path, operator: FileOperator
	    ) -> None:
	        """Validate path and command combination based on execution environment.

	        Args:
	            command: The command about to be executed.
	            path: Target path; must be absolute.
	            operator: File operator used for the existence/directory checks.

	        Raises:
	            ToolError: If `path` is relative; if it does not exist for a
	                non-`create` command; if it is a directory and the command is
	                not `view`; or if it already exists for `create`.
	        """
	        # Check if path is absolute
	        if not path.is_absolute():
	            raise ToolError(f"The path {path} is not an absolute path")

	        if command == "create":
	            # `create` must never overwrite an existing path
	            if await operator.exists(path):
	                raise ToolError(
	                    f"File already exists at: {path}. Cannot overwrite files using command `create`."
	                )
	            return

	        # Every other command needs an existing target
	        if not await operator.exists(path):
	            raise ToolError(
	                f"The path {path} does not exist. Please provide a valid path."
	            )

	        # Directories can only be viewed
	        is_dir = await operator.is_directory(path)
	        if is_dir and command != "view":
	            raise ToolError(
	                f"The path {path} is a directory and only the `view` command can be used on directories"
	            )

	    async def view(
	        self,
	        path: PathLike,
	        view_range: Optional[List[int]] = None,
	        operator: Optional[FileOperator] = None,
	    ) -> CLIResult:
	        """Display file or directory content.

	        Args:
	            path: File or directory to show.
	            view_range: Optional `[start, end]` line range; files only.
	            operator: File operator to use. Defaults to the one selected by
	                `_get_operator`.

	        Returns:
	            A `CLIResult` holding the directory listing or the numbered file
	            content.

	        Raises:
	            ToolError: If `view_range` is given for a directory or is invalid
	                for the file.
	        """
	        if operator is None:
	            operator = self._get_operator()

	        # Determine if path is a directory
	        is_dir = await operator.is_directory(path)

	        if is_dir:
	            # Directory handling
	            if view_range:
	                raise ToolError(
	                    "The `view_range` parameter is not allowed when `path` points to a directory."
	                )

	            return await self._view_directory(path, operator)

	        # File handling
	        return await self._view_file(path, operator, view_range)

	    @staticmethod
	    async def _view_directory(path: PathLike, operator: FileOperator) -> CLIResult:
	        """List a directory up to two levels deep, skipping hidden entries.

	        Args:
	            path: Directory to list.
	            operator: File operator whose `run_command` executes `find`.

	        Returns:
	            A `CLIResult` with the listing (prefixed by an explanatory header
	            when nothing was written to stderr) and any stderr text.
	        """
	        import shlex

	        # `run_command` receives a single command string (presumably run via
	        # a shell -- confirm against the operator), so the path is quoted to
	        # survive spaces and shell metacharacters. The `-path` argument is a
	        # glob: `*/\.*` matches any path with a component starting with a dot.
	        find_cmd = (
	            f"find {shlex.quote(str(path))} -maxdepth 2 -not -path '*/\\.*'"
	        )

	        # Execute command using the operator
	        returncode, stdout, stderr = await operator.run_command(find_cmd)

	        if not stderr:
	            stdout = (
	                f"Here's the files and directories up to 2 levels deep in {path}, "
	                f"excluding hidden items:\n{stdout}\n"
	            )

	        return CLIResult(output=stdout, error=stderr)

	    async def _view_file(
	        self,
	        path: PathLike,
	        operator: FileOperator,
	        view_range: Optional[List[int]] = None,
	    ) -> CLIResult:
	        """Display file content, optionally within a specified line range.

	        Args:
	            path: File to read.
	            operator: File operator used to read the file.
	            view_range: Optional `[start, end]` pair, 1-based and inclusive;
	                `end == -1` means "through the last line".

	        Returns:
	            A `CLIResult` whose output is the numbered (possibly sliced) content.

	        Raises:
	            ToolError: If `view_range` is not two integers or lies outside the
	                file's line range.
	        """
	        # Read file content
	        file_content = await operator.read_file(path)
	        init_line = 1

	        # Apply view range if specified
	        if view_range:
	            if len(view_range) != 2 or not all(isinstance(i, int) for i in view_range):
	                raise ToolError(
	                    "Invalid `view_range`. It should be a list of two integers."
	                )

	            file_lines = file_content.split("\n")
	            n_lines_file = len(file_lines)
	            init_line, final_line = view_range

	            # Validate view range
	            if init_line < 1 or init_line > n_lines_file:
	                raise ToolError(
	                    f"Invalid `view_range`: {view_range}. Its first element `{init_line}` should be "
	                    f"within the range of lines of the file: {[1, n_lines_file]}"
	                )
	            if final_line > n_lines_file:
	                raise ToolError(
	                    f"Invalid `view_range`: {view_range}. Its second element `{final_line}` should be "
	                    f"smaller than the number of lines in the file: `{n_lines_file}`"
	                )
	            if final_line != -1 and final_line < init_line:
	                raise ToolError(
	                    f"Invalid `view_range`: {view_range}. Its second element `{final_line}` should be "
	                    f"larger or equal than its first `{init_line}`"
	                )

	            # Apply range (-1 selects everything from `init_line` onwards)
	            if final_line == -1:
	                file_content = "\n".join(file_lines[init_line - 1 :])
	            else:
	                file_content = "\n".join(file_lines[init_line - 1 : final_line])

	        # Format and return result
	        return CLIResult(
	            output=self._make_output(file_content, str(path), init_line=init_line)
	        )

	    @staticmethod
	    def _occurrence_lines(text: str, needle: str) -> List[int]:
	        """Return the ascending 1-based line numbers where `needle` starts in `text`.

	        Matches are found the same non-overlapping way `str.count` counts them,
	        so multi-line needles are located correctly. Each line is listed once.
	        """
	        # Advance by at least one character so an empty needle cannot loop forever.
	        step = max(len(needle), 1)
	        line_numbers: List[int] = []
	        current_line = 1
	        previous_pos = 0
	        pos = text.find(needle)
	        while pos != -1:
	            # Count only the newlines since the previous match.
	            current_line += text.count("\n", previous_pos, pos)
	            previous_pos = pos
	            if not line_numbers or line_numbers[-1] != current_line:
	                line_numbers.append(current_line)
	            pos = text.find(needle, pos + step)
	        return line_numbers

	    async def str_replace(
	        self,
	        path: PathLike,
	        old_str: str,
	        new_str: Optional[str] = None,
	        operator: Optional[FileOperator] = None,
	    ) -> CLIResult:
	        """Replace a unique string in a file with a new string.

	        Tabs in the file content, `old_str` and `new_str` are expanded before
	        matching, and the expanded content is what gets written back.

	        Args:
	            path: File to edit.
	            old_str: Text that must occur exactly once in the file.
	            new_str: Replacement text; `None` means replace with nothing.
	            operator: File operator to use. Defaults to the one selected by
	                `_get_operator`.

	        Returns:
	            A `CLIResult` with a numbered snippet around the edited region.

	        Raises:
	            ToolError: If `old_str` does not occur, or occurs more than once.
	        """
	        if operator is None:
	            operator = self._get_operator()

	        # Read file content and expand tabs
	        file_content = (await operator.read_file(path)).expandtabs()
	        old_str = old_str.expandtabs()
	        new_str = new_str.expandtabs() if new_str is not None else ""

	        # Check if old_str is unique in the file
	        occurrences = file_content.count(old_str)
	        if occurrences == 0:
	            raise ToolError(
	                f"No replacement was performed, old_str `{old_str}` did not appear verbatim in {path}."
	            )
	        if occurrences > 1:
	            # Report where each match starts; works for multi-line `old_str` too
	            lines = self._occurrence_lines(file_content, old_str)
	            raise ToolError(
	                f"No replacement was performed. Multiple occurrences of old_str `{old_str}` "
	                f"in lines {lines}. Please ensure it is unique"
	            )

	        # Replace old_str with new_str
	        new_file_content = file_content.replace(old_str, new_str)

	        # Write the new content to the file
	        await operator.write_file(path, new_file_content)

	        # Save the original content to history
	        self._file_history[path].append(file_content)

	        # Create a snippet of the edited section: 0-based index of the line on
	        # which the (unique) match starts, plus context on both sides.
	        replacement_line = file_content.count("\n", 0, file_content.find(old_str))
	        start_line = max(0, replacement_line - SNIPPET_LINES)
	        end_line = replacement_line + SNIPPET_LINES + new_str.count("\n")
	        snippet = "\n".join(new_file_content.split("\n")[start_line : end_line + 1])

	        # Prepare the success message
	        success_msg = f"The file {path} has been edited. "
	        success_msg += self._make_output(
	            snippet, f"a snippet of {path}", start_line + 1
	        )
	        success_msg += "Review the changes and make sure they are as expected. Edit the file again if necessary."

	        return CLIResult(output=success_msg)

	    async def insert(
	        self,
	        path: PathLike,
	        insert_line: int,
	        new_str: str,
	        operator: Optional[FileOperator] = None,
	    ) -> CLIResult:
	        """Insert text after a specific line in a file.

	        Tabs in the file content and in `new_str` are expanded, and the
	        expanded content is what gets written back.

	        Args:
	            path: File to edit.
	            insert_line: Number of existing lines to keep before the inserted
	                text; `0` inserts at the top of the file.
	            new_str: Text to insert (may span several lines).
	            operator: File operator to use. Defaults to the one selected by
	                `_get_operator`.

	        Returns:
	            A `CLIResult` with a numbered snippet around the inserted text.

	        Raises:
	            ToolError: If `insert_line` is negative or beyond the file's
	                line count.
	        """
	        if operator is None:
	            operator = self._get_operator()

	        # Read and prepare content
	        file_text = (await operator.read_file(path)).expandtabs()
	        new_str = new_str.expandtabs()
	        file_text_lines = file_text.split("\n")
	        n_lines_file = len(file_text_lines)

	        # Validate insert_line
	        if insert_line < 0 or insert_line > n_lines_file:
	            raise ToolError(
	                f"Invalid `insert_line` parameter: {insert_line}. It should be within "
	                f"the range of lines of the file: {[0, n_lines_file]}"
	            )

	        # Perform insertion
	        new_str_lines = new_str.split("\n")
	        new_file_text_lines = (
	            file_text_lines[:insert_line]
	            + new_str_lines
	            + file_text_lines[insert_line:]
	        )

	        # Create a snippet for preview
	        snippet_lines = (
	            file_text_lines[max(0, insert_line - SNIPPET_LINES) : insert_line]
	            + new_str_lines
	            + file_text_lines[insert_line : insert_line + SNIPPET_LINES]
	        )

	        # Join lines and write to file
	        new_file_text = "\n".join(new_file_text_lines)
	        snippet = "\n".join(snippet_lines)

	        await operator.write_file(path, new_file_text)
	        self._file_history[path].append(file_text)

	        # Prepare success message
	        success_msg = f"The file {path} has been edited. "
	        success_msg += self._make_output(
	            snippet,
	            "a snippet of the edited file",
	            max(1, insert_line - SNIPPET_LINES + 1),
	        )
	        success_msg += "Review the changes and make sure they are as expected (correct indentation, no duplicate lines, etc). Edit the file again if necessary."

	        return CLIResult(output=success_msg)

	    async def undo_edit(
	        self, path: PathLike, operator: Optional[FileOperator] = None
	    ) -> CLIResult:
	        """Revert the last edit made to a file.

	        Args:
	            path: File whose most recent history entry should be restored.
	            operator: File operator to use. Defaults to the one selected by
	                `_get_operator`.

	        Returns:
	            A `CLIResult` confirming the undo and showing the restored content.

	        Raises:
	            ToolError: If no history is recorded for `path`.
	        """
	        if operator is None:
	            operator = self._get_operator()

	        # `.get` avoids creating an empty defaultdict entry for unknown paths
	        history = self._file_history.get(path)
	        if not history:
	            raise ToolError(f"No edit history found for {path}.")

	        old_text = history.pop()
	        await operator.write_file(path, old_text)

	        return CLIResult(
	            output=f"Last edit to {path} undone successfully. {self._make_output(old_text, str(path))}"
	        )

	    def _make_output(
	        self,
	        file_content: str,
	        file_descriptor: str,
	        init_line: int = 1,
	        expand_tabs: bool = True,
	    ) -> str:
	        """Format file content for display with line numbers.

	        Args:
	            file_content: Text to show; truncated via `maybe_truncate` first.
	            file_descriptor: Label inserted into the header line.
	            init_line: Number assigned to the first displayed line.
	            expand_tabs: Whether to expand tabs before numbering.

	        Returns:
	            A header line followed by each content line prefixed with its
	            right-aligned line number and a tab, ending with a newline.
	        """
	        file_content = maybe_truncate(file_content)
	        if expand_tabs:
	            file_content = file_content.expandtabs()

	        # Add line numbers to each line
	        numbered = "\n".join(
	            f"{offset + init_line:6}\t{line}"
	            for offset, line in enumerate(file_content.split("\n"))
	        )

	        return (
	            f"Here's the result of running `cat -n` on {file_descriptor}:\n"
	            + numbered
	            + "\n"
	        )