Spaces:

Speedofmastery
/

orynxml-ai

Paused

App Files Files Community

orynxml-ai / app /tool /str_replace_editor.py

Speedofmastery

Upload folder using huggingface_hub

2f28b62 verified 10 days ago

raw

history blame contribute delete

17.1 kB

	"""File and directory manipulation tool with sandbox support."""

	from collections import defaultdict
	from pathlib import Path
	from typing import Any, DefaultDict, List, Literal, Optional, get_args

	from app.config import config
	from app.exceptions import ToolError
	from app.tool import BaseTool
	from app.tool.base import CLIResult, ToolResult
	from app.tool.file_operators import (
	FileOperator,
	LocalFileOperator,
	PathLike,
	SandboxFileOperator,
	)


	# Closed set of command names accepted by the editor tool.
	Command = Literal["view", "create", "str_replace", "insert", "undo_edit"]

	# Number of context lines shown on each side of an edit in result snippets.
	SNIPPET_LINES: int = 4
	# Character budget for file content before the clipping notice is appended.
	MAX_RESPONSE_LEN: int = 16000
	# Notice appended to content that was cut off at the character budget.
	TRUNCATED_MESSAGE: str = (
	    "<response clipped>"
	    "<NOTE>"
	    "To save on context only part of this file has been shown to you. "
	    "You should retry this tool after you have searched inside the file "
	    "with `grep -n` in order to find the line numbers of what you are "
	    "looking for."
	    "</NOTE>"
	)

	# Tool description: the text assigned to `StrReplaceEditor.description` below.
	# It is a runtime string, so its wording and whitespace are part of the
	# tool's behavior and must not be reformatted.
	_STR_REPLACE_EDITOR_DESCRIPTION = """Custom editing tool for viewing, creating and editing files
	* State is persistent across command calls and discussions with the user
	* If `path` is a file, `view` displays the result of applying `cat -n`. If `path` is a directory, `view` lists non-hidden files and directories up to 2 levels deep
	* The `create` command cannot be used if the specified `path` already exists as a file
	* If a `command` generates a long output, it will be truncated and marked with `<response clipped>`
	* The `undo_edit` command will revert the last edit made to the file at `path`

	Notes for using the `str_replace` command:
	* The `old_str` parameter should match EXACTLY one or more consecutive lines from the original file. Be mindful of whitespaces!
	* If the `old_str` parameter is not unique in the file, the replacement will not be performed. Make sure to include enough context in `old_str` to make it unique
	* The `new_str` parameter should contain the edited lines that should replace the `old_str`
	"""


	def maybe_truncate(
	    content: str, truncate_after: Optional[int] = MAX_RESPONSE_LEN
	) -> str:
	    """Clip ``content`` to ``truncate_after`` characters and flag the cut.

	    Args:
	        content: Text to return, possibly shortened.
	        truncate_after: Maximum number of characters to keep. A falsy value
	            (``None`` or ``0``) disables clipping.

	    Returns:
	        ``content`` unchanged when clipping is disabled or the text fits;
	        otherwise the first ``truncate_after`` characters followed by
	        ``TRUNCATED_MESSAGE``.
	    """
	    needs_clipping = bool(truncate_after) and len(content) > truncate_after
	    if needs_clipping:
	        return content[:truncate_after] + TRUNCATED_MESSAGE
	    return content


	class StrReplaceEditor(BaseTool):
	    """View, create, and edit files through a local or sandboxed file operator.

	    ``execute`` validates the requested path and then dispatches to one of the
	    command handlers (``view``, ``create``, ``str_replace``, ``insert``,
	    ``undo_edit``). All file access goes through a ``FileOperator`` selected by
	    ``_get_operator`` from ``config.sandbox.use_sandbox``.

	    Edit history is kept in ``_file_history`` keyed by path: ``create`` pushes
	    the text it wrote, ``str_replace`` and ``insert`` push the content they
	    read before editing, and ``undo_edit`` writes the latest entry back.
	    """

	    name: str = "str_replace_editor"
	    description: str = _STR_REPLACE_EDITOR_DESCRIPTION
	    parameters: dict = {
	        "type": "object",
	        "properties": {
	            "command": {
	                "description": "The commands to run. Allowed options are: `view`, `create`, `str_replace`, `insert`, `undo_edit`.",
	                "enum": ["view", "create", "str_replace", "insert", "undo_edit"],
	                "type": "string",
	            },
	            "path": {
	                "description": "Absolute path to file or directory.",
	                "type": "string",
	            },
	            "file_text": {
	                "description": "Required parameter of `create` command, with the content of the file to be created.",
	                "type": "string",
	            },
	            "old_str": {
	                "description": "Required parameter of `str_replace` command containing the string in `path` to replace.",
	                "type": "string",
	            },
	            "new_str": {
	                "description": "Optional parameter of `str_replace` command containing the new string (if not given, no string will be added). Required parameter of `insert` command containing the string to insert.",
	                "type": "string",
	            },
	            "insert_line": {
	                "description": "Required parameter of `insert` command. The `new_str` will be inserted AFTER the line `insert_line` of `path`.",
	                "type": "integer",
	            },
	            "view_range": {
	                "description": "Optional parameter of `view` command when `path` points to a file. If none is given, the full file is shown. If provided, the file will be shown in the indicated line number range, e.g. [11, 12] will show lines 11 and 12. Indexing at 1 to start. Setting `[start_line, -1]` shows all lines from `start_line` to the end of the file.",
	                "items": {"type": "integer"},
	                "type": "array",
	            },
	        },
	        "required": ["command", "path"],
	    }
	    # Per-path stack of file contents used by `undo_edit`.
	    # NOTE(review): declared at class level; whether instances share it depends
	    # on how BaseTool treats underscore attributes -- confirm against BaseTool.
	    _file_history: DefaultDict[PathLike, List[str]] = defaultdict(list)
	    _local_operator: LocalFileOperator = LocalFileOperator()
	    _sandbox_operator: SandboxFileOperator = SandboxFileOperator()

	    def _get_operator(self) -> FileOperator:
	        """Return the sandbox operator when sandboxing is enabled, else the local one."""
	        return (
	            self._sandbox_operator
	            if config.sandbox.use_sandbox
	            else self._local_operator
	        )

	    def _resolve_operator(self, operator: Optional[FileOperator]) -> FileOperator:
	        """Return ``operator``, falling back to ``_get_operator()`` when it is ``None``."""
	        return self._get_operator() if operator is None else operator

	    async def execute(
	        self,
	        *,
	        command: Command,
	        path: str,
	        file_text: Optional[str] = None,
	        view_range: Optional[List[int]] = None,
	        old_str: Optional[str] = None,
	        new_str: Optional[str] = None,
	        insert_line: Optional[int] = None,
	        **kwargs: Any,
	    ) -> str:
	        """Validate the request and run one editor command.

	        Args:
	            command: One of the names in ``Command``.
	            path: Absolute path of the target file or directory.
	            file_text: Content to write; required for ``create``.
	            view_range: Optional ``[start, end]`` line range for ``view``.
	            old_str: Text to replace; required for ``str_replace``.
	            new_str: Replacement text for ``str_replace`` (optional) or the
	                text to insert for ``insert`` (required).
	            insert_line: Line after which to insert; required for ``insert``.
	            **kwargs: Accepted and ignored.

	        Returns:
	            ``str()`` of the result object produced by the command.

	        Raises:
	            ToolError: If path validation fails, a required parameter is
	                missing, or ``command`` is not recognized.
	        """
	        operator = self._get_operator()

	        # Reject relative paths, missing targets, and command/path mismatches
	        # before touching any file.
	        await self.validate_path(command, Path(path), operator)

	        if command == "view":
	            result = await self.view(path, view_range, operator)
	        elif command == "create":
	            if file_text is None:
	                raise ToolError("Parameter `file_text` is required for command: create")
	            await operator.write_file(path, file_text)
	            self._file_history[path].append(file_text)
	            result = ToolResult(output=f"File created successfully at: {path}")
	        elif command == "str_replace":
	            if old_str is None:
	                raise ToolError(
	                    "Parameter `old_str` is required for command: str_replace"
	                )
	            result = await self.str_replace(path, old_str, new_str, operator)
	        elif command == "insert":
	            if insert_line is None:
	                raise ToolError(
	                    "Parameter `insert_line` is required for command: insert"
	                )
	            if new_str is None:
	                raise ToolError("Parameter `new_str` is required for command: insert")
	            result = await self.insert(path, insert_line, new_str, operator)
	        elif command == "undo_edit":
	            result = await self.undo_edit(path, operator)
	        else:
	            # Type checking should prevent this; kept as a runtime safety net.
	            raise ToolError(
	                f'Unrecognized command {command}. The allowed commands for the {self.name} tool are: {", ".join(get_args(Command))}'
	            )

	        return str(result)

	    async def validate_path(
	        self, command: str, path: Path, operator: FileOperator
	    ) -> None:
	        """Check that ``path`` is usable for ``command``.

	        Args:
	            command: The command about to be executed.
	            path: Target path; must be absolute.
	            operator: File operator used for the existence/directory checks.

	        Raises:
	            ToolError: If the path is relative; if it already exists for
	                ``create``; if it does not exist for any other command; or if
	                it is a directory and the command is not ``view``.
	        """
	        if not path.is_absolute():
	            raise ToolError(f"The path {path} is not an absolute path")

	        if command == "create":
	            # `create` must never overwrite an existing path.
	            if await operator.exists(path):
	                raise ToolError(
	                    f"File already exists at: {path}. Cannot overwrite files using command `create`."
	                )
	            return

	        if not await operator.exists(path):
	            raise ToolError(
	                f"The path {path} does not exist. Please provide a valid path."
	            )

	        is_dir = await operator.is_directory(path)
	        if is_dir and command != "view":
	            raise ToolError(
	                f"The path {path} is a directory and only the `view` command can be used on directories"
	            )

	    async def view(
	        self,
	        path: PathLike,
	        view_range: Optional[List[int]] = None,
	        operator: Optional[FileOperator] = None,
	    ) -> CLIResult:
	        """Display a file's content or a directory listing.

	        Args:
	            path: File or directory to show.
	            view_range: Optional ``[start, end]`` line range; files only.
	            operator: File operator to use; defaults to ``_get_operator()``.

	        Returns:
	            The result of ``_view_directory`` or ``_view_file``.

	        Raises:
	            ToolError: If ``view_range`` is given for a directory.
	        """
	        operator = self._resolve_operator(operator)

	        if await operator.is_directory(path):
	            if view_range:
	                raise ToolError(
	                    "The `view_range` parameter is not allowed when `path` points to a directory."
	                )
	            return await self._view_directory(path, operator)

	        return await self._view_file(path, operator, view_range)

	    @staticmethod
	    async def _view_directory(path: PathLike, operator: FileOperator) -> CLIResult:
	        """List entries up to two levels below ``path``, skipping hidden ones.

	        Args:
	            path: Directory to list.
	            operator: File operator whose ``run_command`` executes ``find``.

	        Returns:
	            A ``CLIResult`` carrying the command's stdout (prefixed with an
	            explanatory header when stderr is empty) and its stderr.
	        """
	        import shlex

	        # Quote the path so spaces or shell metacharacters cannot alter the
	        # command. `*/.*` excludes every path with a component that starts
	        # with a dot (this includes entries under a hidden start directory).
	        find_cmd = f"find {shlex.quote(str(path))} -maxdepth 2 -not -path '*/.*'"

	        _returncode, stdout, stderr = await operator.run_command(find_cmd)

	        if not stderr:
	            stdout = (
	                f"Here's the files and directories up to 2 levels deep in {path}, "
	                f"excluding hidden items:\n{stdout}\n"
	            )

	        return CLIResult(output=stdout, error=stderr)

	    async def _view_file(
	        self,
	        path: PathLike,
	        operator: FileOperator,
	        view_range: Optional[List[int]] = None,
	    ) -> CLIResult:
	        """Return numbered file content, optionally limited to a line range.

	        Args:
	            path: File to read.
	            operator: File operator used to read the file.
	            view_range: Optional ``[start, end]`` (1-based, inclusive). An
	                ``end`` of ``-1`` means "through the last line".

	        Returns:
	            A ``CLIResult`` whose output is produced by ``_make_output``.

	        Raises:
	            ToolError: If ``view_range`` is not two integers or lies outside
	                the file's line range.
	        """
	        file_content = await operator.read_file(path)
	        init_line = 1

	        if view_range:
	            if len(view_range) != 2 or not all(isinstance(i, int) for i in view_range):
	                raise ToolError(
	                    "Invalid `view_range`. It should be a list of two integers."
	                )

	            file_lines = file_content.split("\n")
	            n_lines_file = len(file_lines)
	            init_line, final_line = view_range

	            if init_line < 1 or init_line > n_lines_file:
	                raise ToolError(
	                    f"Invalid `view_range`: {view_range}. Its first element `{init_line}` should be "
	                    f"within the range of lines of the file: {[1, n_lines_file]}"
	                )
	            if final_line > n_lines_file:
	                raise ToolError(
	                    f"Invalid `view_range`: {view_range}. Its second element `{final_line}` should be "
	                    f"smaller than the number of lines in the file: `{n_lines_file}`"
	                )
	            if final_line != -1 and final_line < init_line:
	                raise ToolError(
	                    f"Invalid `view_range`: {view_range}. Its second element `{final_line}` should be "
	                    f"larger or equal than its first `{init_line}`"
	                )

	            # Slice with 0-based indices; -1 selects everything to the end.
	            if final_line == -1:
	                file_content = "\n".join(file_lines[init_line - 1 :])
	            else:
	                file_content = "\n".join(file_lines[init_line - 1 : final_line])

	        return CLIResult(
	            output=self._make_output(file_content, str(path), init_line=init_line)
	        )

	    @staticmethod
	    def _occurrence_lines(text: str, needle: str) -> List[int]:
	        """Return the distinct 1-based lines on which occurrences of ``needle`` start."""
	        line_numbers: List[int] = []
	        line_no = 1
	        cursor = 0
	        step = max(len(needle), 1)  # non-overlapping scan, like str.count
	        pos = text.find(needle)
	        while pos != -1:
	            # Only count the newlines passed since the previous match.
	            line_no += text.count("\n", cursor, pos)
	            cursor = pos
	            if not line_numbers or line_numbers[-1] != line_no:
	                line_numbers.append(line_no)
	            pos = text.find(needle, pos + step)
	        return line_numbers

	    async def str_replace(
	        self,
	        path: PathLike,
	        old_str: str,
	        new_str: Optional[str] = None,
	        operator: Optional[FileOperator] = None,
	    ) -> CLIResult:
	        """Replace the single occurrence of ``old_str`` in a file.

	        Args:
	            path: File to edit.
	            old_str: Text that must occur exactly once in the file.
	            new_str: Replacement text; ``None`` replaces with nothing.
	            operator: File operator to use; defaults to ``_get_operator()``.

	        Returns:
	            A ``CLIResult`` with a numbered snippet around the edit.

	        Raises:
	            ToolError: If ``old_str`` is absent or occurs more than once.
	        """
	        operator = self._resolve_operator(operator)

	        # NOTE: tabs are expanded in the file content as well, and the
	        # expanded text is what gets written back.
	        file_content = (await operator.read_file(path)).expandtabs()
	        old_str = old_str.expandtabs()
	        new_str = new_str.expandtabs() if new_str is not None else ""

	        occurrences = file_content.count(old_str)
	        if occurrences == 0:
	            raise ToolError(
	                f"No replacement was performed, old_str `{old_str}` did not appear verbatim in {path}."
	            )
	        if occurrences > 1:
	            # Report where each match starts; works for multi-line old_str too.
	            lines = self._occurrence_lines(file_content, old_str)
	            raise ToolError(
	                f"No replacement was performed. Multiple occurrences of old_str `{old_str}` "
	                f"in lines {lines}. Please ensure it is unique"
	            )

	        new_file_content = file_content.replace(old_str, new_str)

	        await operator.write_file(path, new_file_content)

	        # Keep the pre-edit content so the change can be undone.
	        self._file_history[path].append(file_content)

	        # 0-based line of the edit = number of newlines before the match.
	        # `find` is used instead of `split` so an empty old_str cannot raise.
	        replacement_line = file_content.count("\n", 0, file_content.find(old_str))
	        start_line = max(0, replacement_line - SNIPPET_LINES)
	        end_line = replacement_line + SNIPPET_LINES + new_str.count("\n")
	        snippet = "\n".join(new_file_content.split("\n")[start_line : end_line + 1])

	        success_msg = f"The file {path} has been edited. "
	        success_msg += self._make_output(
	            snippet, f"a snippet of {path}", start_line + 1
	        )
	        success_msg += "Review the changes and make sure they are as expected. Edit the file again if necessary."

	        return CLIResult(output=success_msg)

	    async def insert(
	        self,
	        path: PathLike,
	        insert_line: int,
	        new_str: str,
	        operator: Optional[FileOperator] = None,
	    ) -> CLIResult:
	        """Insert ``new_str`` after line ``insert_line`` of a file.

	        Args:
	            path: File to edit.
	            insert_line: Line after which to insert; ``0`` inserts at the top.
	            new_str: Text to insert (may span several lines).
	            operator: File operator to use; defaults to ``_get_operator()``.

	        Returns:
	            A ``CLIResult`` with a numbered snippet around the insertion.

	        Raises:
	            ToolError: If ``insert_line`` is negative or past the last line.
	        """
	        operator = self._resolve_operator(operator)

	        # NOTE: tabs in the existing file content are expanded and written back.
	        file_text = (await operator.read_file(path)).expandtabs()
	        new_str = new_str.expandtabs()
	        file_text_lines = file_text.split("\n")
	        n_lines_file = len(file_text_lines)

	        if insert_line < 0 or insert_line > n_lines_file:
	            raise ToolError(
	                f"Invalid `insert_line` parameter: {insert_line}. It should be within "
	                f"the range of lines of the file: {[0, n_lines_file]}"
	            )

	        new_str_lines = new_str.split("\n")
	        new_file_text_lines = (
	            file_text_lines[:insert_line]
	            + new_str_lines
	            + file_text_lines[insert_line:]
	        )

	        # Preview: up to SNIPPET_LINES of context on each side of the new text.
	        snippet_lines = (
	            file_text_lines[max(0, insert_line - SNIPPET_LINES) : insert_line]
	            + new_str_lines
	            + file_text_lines[insert_line : insert_line + SNIPPET_LINES]
	        )

	        new_file_text = "\n".join(new_file_text_lines)
	        snippet = "\n".join(snippet_lines)

	        await operator.write_file(path, new_file_text)
	        self._file_history[path].append(file_text)

	        success_msg = f"The file {path} has been edited. "
	        success_msg += self._make_output(
	            snippet,
	            "a snippet of the edited file",
	            max(1, insert_line - SNIPPET_LINES + 1),
	        )
	        success_msg += "Review the changes and make sure they are as expected (correct indentation, no duplicate lines, etc). Edit the file again if necessary."

	        return CLIResult(output=success_msg)

	    async def undo_edit(
	        self, path: PathLike, operator: Optional[FileOperator] = None
	    ) -> CLIResult:
	        """Write the most recent history entry for ``path`` back to the file.

	        Args:
	            path: File whose last recorded content should be restored.
	            operator: File operator to use; defaults to ``_get_operator()``.

	        Returns:
	            A ``CLIResult`` containing the restored content.

	        Raises:
	            ToolError: If no history is recorded for ``path``.
	        """
	        operator = self._resolve_operator(operator)

	        # `.get` avoids creating an empty defaultdict entry for unknown paths.
	        history = self._file_history.get(path)
	        if not history:
	            raise ToolError(f"No edit history found for {path}.")

	        # Pop only after the write succeeds so a failed write keeps the entry.
	        old_text = history[-1]
	        await operator.write_file(path, old_text)
	        history.pop()

	        return CLIResult(
	            output=f"Last edit to {path} undone successfully. {self._make_output(old_text, str(path))}"
	        )

	    def _make_output(
	        self,
	        file_content: str,
	        file_descriptor: str,
	        init_line: int = 1,
	        expand_tabs: bool = True,
	    ) -> str:
	        """Format content like ``cat -n`` output.

	        Args:
	            file_content: Text to display; clipped by ``maybe_truncate`` first.
	            file_descriptor: Label inserted into the header line.
	            init_line: Number assigned to the first displayed line.
	            expand_tabs: Whether to expand tabs in the content before numbering.

	        Returns:
	            A header line followed by the content, each line prefixed with a
	            width-6 line number and a tab, ending with a newline.
	        """
	        file_content = maybe_truncate(file_content)
	        if expand_tabs:
	            file_content = file_content.expandtabs()

	        numbered = "\n".join(
	            f"{i + init_line:6}\t{line}"
	            for i, line in enumerate(file_content.split("\n"))
	        )

	        return (
	            f"Here's the result of running `cat -n` on {file_descriptor}:\n"
	            + numbered
	            + "\n"
	        )