Spaces:

ar08
/

zzz

Paused

App Files Files Community

zzz / tests /unit /test_agent_skill.py

ar08

Upload 1040 files

246d201 verified 8 months ago

raw

history blame

23.9 kB

	import contextlib
	import io
	import sys

	import docx
	import pytest

	from openhands.runtime.plugins.agent_skills.file_ops.file_ops import (
	WINDOW,
	_print_window,
	find_file,
	goto_line,
	open_file,
	scroll_down,
	scroll_up,
	search_dir,
	search_file,
	)
	from openhands.runtime.plugins.agent_skills.file_reader.file_readers import (
	parse_docx,
	parse_latex,
	parse_pdf,
	parse_pptx,
	)


	# CURRENT_FILE must be reset for each test
	@pytest.fixture(autouse=True)
	def reset_current_file():
	    """Set ``agentskills.CURRENT_FILE`` to ``None`` before every test (autouse)."""
	    # The import stays inside the fixture, as in the original.
	    from openhands.runtime.plugins.agent_skills import agentskills as skills_module

	    skills_module.CURRENT_FILE = None


	def _numbered_test_lines(start, end) -> str:
	    """Return the lines ``'<n>|'`` for every ``n`` in ``[start, end]``.

	    The lines are joined with newlines and a final newline is appended, so
	    an empty range (``start > end``) yields a single newline.
	    """
	    # A plain '|' is used on purpose: the former '\|' is not a valid escape
	    # sequence and left a literal backslash in every generated line.
	    numbered = (f'{line_no}|' for line_no in range(start, end + 1))
	    return '\n'.join(numbered) + '\n'


	def _generate_test_file_with_lines(temp_path, num_lines) -> str:
	    """Create ``test_file.py`` under ``temp_path`` holding ``num_lines`` newlines.

	    Returns the object produced by ``temp_path / 'test_file.py'``; it is not
	    converted to ``str``.
	    """
	    target = temp_path / 'test_file.py'
	    blank_content = '\n' * num_lines
	    target.write_text(blank_content)
	    return target


	def _generate_ruby_test_file_with_lines(temp_path, num_lines) -> str:
	    """Create ``test_file.rb`` under ``temp_path`` holding ``num_lines`` newlines.

	    Returns the object produced by ``temp_path / 'test_file.rb'``; it is not
	    converted to ``str``.
	    """
	    target = temp_path / 'test_file.rb'
	    blank_content = '\n' * num_lines
	    target.write_text(blank_content)
	    return target


	def _calculate_window_bounds(current_line, total_lines, window_size):
	    """Return the ``(start, end)`` line numbers of a window around ``current_line``.

	    ``total_lines`` is accepted but does not take part in the calculation.
	    """
	    radius = window_size // 2
	    first = current_line - radius
	    if first < 0:
	        # The window would begin before the file: use lines 1..window_size.
	        return 1, window_size
	    return first, current_line + radius


	def _capture_file_operation_error(operation, expected_error_msg):
	    """Call ``operation`` and assert its stripped stdout equals ``expected_error_msg``."""
	    with io.StringIO() as captured, contextlib.redirect_stdout(captured):
	        operation()
	        printed = captured.getvalue()
	    # Surrounding whitespace (e.g. the trailing newline) is ignored.
	    assert printed.strip() == expected_error_msg


	# Separator line: 49 dashes followed by a newline.
	SEP = f"{'-' * 49}\n"


	# =============================================================================


	def test_open_file_unexist_path():
	    """``open_file`` on a missing path prints a 'not found' error."""

	    def attempt_open():
	        open_file('/unexist/path/a.txt')

	    expected_message = 'ERROR: File /unexist/path/a.txt not found.'
	    _capture_file_operation_error(attempt_open, expected_message)


	def test_open_file(tmp_path):
	    """``open_file`` on a five-line file prints the header, all lines and both boundary markers."""
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path))
	        result = buf.getvalue()

	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    expected = (
	        f'[File: {temp_file_path} (5 lines total)]\n'
	        '(this is the beginning of the file)\n'
	        '1|Line 1\n'
	        '2|Line 2\n'
	        '3|Line 3\n'
	        '4|Line 4\n'
	        '5|Line 5\n'
	        '(this is the end of the file)\n'
	    )
	    assert result.split('\n') == expected.split('\n')


	def test_open_file_with_indentation(tmp_path):
	    """``open_file`` keeps the leading space of an indented line in its output."""
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('Line 1\n Line 2\nLine 3\nLine 4\nLine 5')

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path))
	        result = buf.getvalue()

	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    expected = (
	        f'[File: {temp_file_path} (5 lines total)]\n'
	        '(this is the beginning of the file)\n'
	        '1|Line 1\n'
	        '2| Line 2\n'
	        '3|Line 3\n'
	        '4|Line 4\n'
	        '5|Line 5\n'
	        '(this is the end of the file)\n'
	    )
	    assert result.split('\n') == expected.split('\n')


	def test_open_file_long(tmp_path):
	    """``open_file(path, 1, 50)`` on a 1000-line file shows lines 1-50 and the scroll hint."""
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('\n'.join(f'Line {i}' for i in range(1, 1001)))

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path), 1, 50)
	        result = buf.getvalue()

	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    expected = (
	        f'[File: {temp_file_path} (1000 lines total)]\n'
	        '(this is the beginning of the file)\n'
	        + ''.join(f'{i}|Line {i}\n' for i in range(1, 51))
	        + '(950 more lines below)\n'
	        '[Use `scroll_down` to view the next 100 lines of the file!]\n'
	    )
	    assert result.split('\n') == expected.split('\n')


	def test_open_file_long_with_lineno(tmp_path):
	    """``open_file(path, 100)`` on a 1000-line file shows the window around line 100."""
	    total_lines = 1000
	    cur_line = 100
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text(
	        '\n'.join(f'Line {i}' for i in range(1, total_lines + 1))
	    )

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path), cur_line)
	        result = buf.getvalue()

	    # The expected bounds come from the helper, so the test does not
	    # hard-code any assumption about the value of WINDOW.
	    start, end = _calculate_window_bounds(cur_line, total_lines, WINDOW)

	    parts = [f'[File: {temp_file_path} ({total_lines} lines total)]\n']
	    if start == 1:
	        parts.append('(this is the beginning of the file)\n')
	    else:
	        parts.append(f'({start - 1} more lines above)\n')
	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    parts.extend(f'{i}|Line {i}\n' for i in range(start, end + 1))
	    if end == total_lines:
	        parts.append('(this is the end of the file)\n')
	    else:
	        parts.append(f'({total_lines - end} more lines below)\n')
	        # The scroll hint is only expected when more lines follow; the
	        # short-file tests expect no hint after the end-of-file marker.
	        parts.append(
	            '[Use `scroll_down` to view the next 100 lines of the file!]\n'
	        )
	    expected = ''.join(parts)
	    assert result.split('\n') == expected.split('\n')


	def test_goto_line(tmp_path):
	    """``goto_line(500)`` re-renders the window around line 500 of the open file."""
	    temp_file_path = tmp_path / 'a.txt'
	    total_lines = 1000
	    temp_file_path.write_text(
	        '\n'.join(f'Line {i}' for i in range(1, total_lines + 1))
	    )
	    header = f'[File: {temp_file_path} ({total_lines} lines total)]\n'

	    # Step 1: open the file without a line number.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path))
	        result = buf.getvalue()

	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    expected = (
	        header
	        + '(this is the beginning of the file)\n'
	        + ''.join(f'{i}|Line {i}\n' for i in range(1, WINDOW + 1))
	        + f'({total_lines - WINDOW} more lines below)\n'
	        + '[Use `scroll_down` to view the next 100 lines of the file!]\n'
	    )
	    assert result.split('\n') == expected.split('\n')

	    # Step 2: jump to line 500; no scroll hint is expected in this output.
	    cur_line = 500
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            goto_line(cur_line)
	        result = buf.getvalue()

	    start, end = _calculate_window_bounds(cur_line, total_lines, WINDOW)
	    if start == 1:
	        above = '(this is the beginning of the file)\n'
	    else:
	        above = f'({start - 1} more lines above)\n'
	    if end == total_lines:
	        below = '(this is the end of the file)\n'
	    else:
	        below = f'({total_lines - end} more lines below)\n'
	    expected = (
	        header
	        + above
	        + ''.join(f'{i}|Line {i}\n' for i in range(start, end + 1))
	        + below
	    )
	    assert result.split('\n') == expected.split('\n')


	def test_goto_line_negative(tmp_path):
	    """``goto_line(-1)`` on a four-line file reports the valid line range."""
	    temp_file_path = tmp_path / 'a.txt'
	    file_text = '\n'.join([f'Line {n}' for n in range(1, 5)])
	    temp_file_path.write_text(file_text)

	    # Open the file first; its output is captured and discarded.
	    with io.StringIO() as sink, contextlib.redirect_stdout(sink):
	        open_file(str(temp_file_path))

	    expected_message = 'ERROR: Line number must be between 1 and 4.'
	    _capture_file_operation_error(lambda: goto_line(-1), expected_message)


	def test_goto_line_out_of_bound(tmp_path):
	    """``goto_line(100)`` on a nine-line file reports the valid line range."""
	    temp_file_path = tmp_path / 'a.txt'
	    file_text = '\n'.join([f'Line {n}' for n in range(1, 10)])
	    temp_file_path.write_text(file_text)

	    # Open the file first; its output is captured and discarded.
	    with io.StringIO() as sink, contextlib.redirect_stdout(sink):
	        open_file(str(temp_file_path))

	    expected_message = 'ERROR: Line number must be between 1 and 9.'
	    _capture_file_operation_error(lambda: goto_line(100), expected_message)


	def test_scroll_down(tmp_path):
	    """``scroll_down`` after ``open_file`` shows lines WINDOW+1 .. 2*WINDOW+1."""
	    temp_file_path = tmp_path / 'a.txt'
	    total_lines = 1000
	    temp_file_path.write_text(
	        '\n'.join(f'Line {i}' for i in range(1, total_lines + 1))
	    )
	    header = f'[File: {temp_file_path} ({total_lines} lines total)]\n'

	    def expected_window(first, last):
	        """Render the boundary markers and numbered lines for first..last."""
	        if first == 1:
	            above = '(this is the beginning of the file)\n'
	        else:
	            above = f'({first - 1} more lines above)\n'
	        if last == total_lines:
	            below = '(this is the end of the file)\n'
	        else:
	            below = f'({total_lines - last} more lines below)\n'
	        # Numbered lines use a plain '|' separator; the former '\|' was an
	        # invalid escape that put a literal backslash into the expectation.
	        numbered = ''.join(f'{i}|Line {i}\n' for i in range(first, last + 1))
	        return above + numbered + below

	    # Step 1: open the file at its beginning.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path))
	        result = buf.getvalue()

	    start, end = _calculate_window_bounds(1, total_lines, WINDOW)
	    expected = header + expected_window(start, end)
	    if end != total_lines:
	        # The scroll hint is only expected when more lines follow.
	        expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
	    assert result.split('\n') == expected.split('\n')

	    # Step 2: scroll down one window; no scroll hint is expected here.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            scroll_down()
	        result = buf.getvalue()

	    expected = header + expected_window(WINDOW + 1, 2 * WINDOW + 1)
	    assert result.split('\n') == expected.split('\n')


	def test_scroll_up(tmp_path):
	    """``scroll_up`` after opening at line 300 shows the window starting WINDOW lines earlier."""
	    temp_file_path = tmp_path / 'a.txt'
	    total_lines = 1000
	    temp_file_path.write_text(
	        '\n'.join(f'Line {i}' for i in range(1, total_lines + 1))
	    )
	    header = f'[File: {temp_file_path} ({total_lines} lines total)]\n'

	    def expected_window(first, last):
	        """Render the boundary markers and numbered lines for first..last."""
	        if first == 1:
	            above = '(this is the beginning of the file)\n'
	        else:
	            above = f'({first - 1} more lines above)\n'
	        if last == total_lines:
	            below = '(this is the end of the file)\n'
	        else:
	            below = f'({total_lines - last} more lines below)\n'
	        # Numbered lines use a plain '|' separator; the former '\|' was an
	        # invalid escape that put a literal backslash into the expectation.
	        numbered = ''.join(f'{i}|Line {i}\n' for i in range(first, last + 1))
	        return above + numbered + below

	    # Step 1: open the file centred on line 300.
	    cur_line = 300
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path), cur_line)
	        result = buf.getvalue()

	    start, end = _calculate_window_bounds(cur_line, total_lines, WINDOW)
	    expected = header + expected_window(start, end)
	    if end != total_lines:
	        # The scroll hint is only expected when more lines follow.
	        expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
	    assert result.split('\n') == expected.split('\n')

	    # Step 2: scroll up one window; no scroll hint is expected here.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            scroll_up()
	        result = buf.getvalue()

	    cur_line = cur_line - WINDOW
	    expected = header + expected_window(cur_line, cur_line + WINDOW)
	    assert result.split('\n') == expected.split('\n')


	def test_scroll_down_edge(tmp_path):
	    """``scroll_down`` on a file that already fits the window leaves the output unchanged."""
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('\n'.join(f'Line {i}' for i in range(1, 10)))

	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    expected = (
	        f'[File: {temp_file_path} (9 lines total)]\n'
	        '(this is the beginning of the file)\n'
	        + ''.join(f'{i}|Line {i}\n' for i in range(1, 10))
	        + '(this is the end of the file)\n'
	    )

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(temp_file_path))
	        result = buf.getvalue()
	    # Previously this output was captured but never compared.
	    assert result.split('\n') == expected.split('\n')

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            scroll_down()
	        result = buf.getvalue()

	    # Scrolling must not change what is shown: the whole file is visible.
	    assert result.split('\n') == expected.split('\n')


	def test_print_window_internal(tmp_path):
	    """``_print_window`` with a window of 2 prints one line either side of line 50, backticks intact."""
	    test_file_path = tmp_path / 'a.txt'
	    # As in the original test, the file is opened while still empty and
	    # only afterwards filled with 100 lines.
	    test_file_path.write_text('')
	    open_file(str(test_file_path))
	    with open(test_file_path, 'w') as file:
	        file.writelines(f'Line `{i}`\n' for i in range(1, 101))

	    current_line = 50
	    window = 2

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            _print_window(
	                str(test_file_path), current_line, window, return_str=False
	            )
	        result = buf.getvalue()

	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    expected = (
	        '(48 more lines above)\n'
	        '49|Line `49`\n'
	        '50|Line `50`\n'
	        '51|Line `51`\n'
	        '(49 more lines below)\n'
	    )
	    assert result == expected


	def test_open_file_large_line_number(tmp_path):
	    """``open_file(path, 800, 100)`` on a 999-line file shows lines 750-850 and the scroll hint."""
	    test_file_path = tmp_path / 'a.txt'
	    # As in the original test, the file is opened while still empty and
	    # only afterwards filled with 999 lines.
	    test_file_path.write_text('')
	    open_file(str(test_file_path))
	    with open(test_file_path, 'w') as file:
	        file.writelines(f'Line `{i}`\n' for i in range(1, 1000))

	    current_line = 800
	    window = 100

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            open_file(str(test_file_path), current_line, window)
	        result = buf.getvalue()

	    # Numbered lines use a plain '|' separator; the former '\|' was an
	    # invalid escape that put a literal backslash into the expectation.
	    expected = (
	        f'[File: {test_file_path} (999 lines total)]\n'
	        '(749 more lines above)\n'
	        + ''.join(f'{i}|Line `{i}`\n' for i in range(750, 850 + 1))
	        + '(149 more lines below)\n'
	        '[Use `scroll_down` to view the next 100 lines of the file!]\n'
	    )
	    assert result == expected


	def test_search_dir(tmp_path):
	    """``search_dir`` reports the one file and line that contain the search term."""
	    shared_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
	    # 100 files share the same five lines; only a50.txt also gets "bingo".
	    for index in range(1, 101):
	        content = (shared_text + 'bingo') if index == 50 else shared_text
	        (tmp_path / f'a{index}.txt').write_text(content)

	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        search_dir('bingo', str(tmp_path))
	        result = stream.getvalue()
	    assert result is not None

	    expected_lines = [
	        f'[Found 1 matches for "bingo" in {tmp_path}]',
	        f'{tmp_path}/a50.txt (Line 6): bingo',
	        f'[End of matches for "bingo" in {tmp_path}]',
	    ]
	    expected = '\n'.join(expected_lines) + '\n'
	    assert result.split('\n') == expected.split('\n')


	def test_search_dir_not_exist_term(tmp_path):
	    """``search_dir`` prints a 'No matches found' line when no file contains the term."""
	    shared_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
	    # None of the 100 files contains the term searched for below.
	    for index in range(1, 101):
	        (tmp_path / f'a{index}.txt').write_text(shared_text)

	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        search_dir('non-exist', str(tmp_path))
	        result = stream.getvalue()
	    assert result is not None

	    expected = f'No matches found for "non-exist" in {tmp_path}\n'
	    assert result.split('\n') == expected.split('\n')


	def test_search_dir_too_much_match(tmp_path):
	    """``search_dir`` asks to narrow the search when the term matches in all 999 files."""
	    shared_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
	    # Every one of the 999 files contains the term "Line 5".
	    for index in range(1, 1000):
	        (tmp_path / f'a{index}.txt').write_text(shared_text)

	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        search_dir('Line 5', str(tmp_path))
	        result = stream.getvalue()
	    assert result is not None

	    expected = f'More than 999 files matched for "Line 5" in {tmp_path}. Please narrow your search.\n'
	    assert result.split('\n') == expected.split('\n')


	def test_search_dir_cwd(tmp_path, monkeypatch):
	    """``search_dir`` without a directory argument searches the current directory, shown as ``./``."""
	    # monkeypatch restores the working directory after the test.
	    monkeypatch.chdir(tmp_path)

	    shared_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
	    # 100 files share the same five lines; only a50.txt also gets "bingo".
	    for index in range(1, 101):
	        content = (shared_text + 'bingo') if index == 50 else shared_text
	        (tmp_path / f'a{index}.txt').write_text(content)

	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        search_dir('bingo')
	        result = stream.getvalue()
	    assert result is not None

	    expected_lines = [
	        '[Found 1 matches for "bingo" in ./]',
	        './a50.txt (Line 6): bingo',
	        '[End of matches for "bingo" in ./]',
	    ]
	    expected = '\n'.join(expected_lines) + '\n'
	    assert result.split('\n') == expected.split('\n')


	def test_search_file(tmp_path):
	    """``search_file`` lists the matching line between 'Found' and 'End of matches' markers."""
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        search_file('Line 5', str(temp_file_path))
	        result = stream.getvalue()
	    assert result is not None

	    expected = ''.join(
	        [
	            f'[Found 1 matches for "Line 5" in {temp_file_path}]\n',
	            'Line 5: Line 5\n',
	            f'[End of matches for "Line 5" in {temp_file_path}]\n',
	        ]
	    )
	    assert result.split('\n') == expected.split('\n')


	def test_search_file_not_exist_term(tmp_path):
	    """``search_file`` prints a bracketed 'No matches found' line for an absent term."""
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        search_file('Line 6', str(temp_file_path))
	        result = stream.getvalue()
	    assert result is not None

	    expected = f'[No matches found for "Line 6" in {temp_file_path}]\n'
	    assert result.split('\n') == expected.split('\n')


	def test_search_file_not_exist_file():
	    """``search_file`` on a missing path prints a 'not found' error."""

	    def attempt_search():
	        search_file('Line 6', '/unexist/path/a.txt')

	    expected_message = 'ERROR: File /unexist/path/a.txt not found.'
	    _capture_file_operation_error(attempt_search, expected_message)


	def test_find_file(tmp_path):
	    """``find_file`` lists the matching path between 'Found' and 'End of matches' markers."""
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        find_file('a.txt', str(tmp_path))
	        result = stream.getvalue()
	    assert result is not None

	    expected = ''.join(
	        [
	            f'[Found 1 matches for "a.txt" in {tmp_path}]\n',
	            f'{tmp_path}/a.txt\n',
	            f'[End of matches for "a.txt" in {tmp_path}]\n',
	        ]
	    )
	    assert result.split('\n') == expected.split('\n')


	def test_find_file_cwd(tmp_path, monkeypatch):
	    """``find_file`` without a directory argument searches the current directory.

	    The original test only asserted ``result is not None``, which is always
	    true for ``StringIO.getvalue()``. The assertions below use the header and
	    footer format from the sibling ``find_file`` tests, with the directory
	    shown as ``./``.
	    """
	    # monkeypatch restores the working directory after the test.
	    monkeypatch.chdir(tmp_path)
	    temp_file_path = tmp_path / 'a.txt'
	    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            find_file('a.txt')
	        result = buf.getvalue()

	    lines = result.split('\n')
	    assert lines[0] == '[Found 1 matches for "a.txt" in ./]'
	    # The match line is only checked loosely; the exact form of the
	    # relative path is presumably './a.txt' (TODO confirm and tighten).
	    assert lines[1].endswith('a.txt')
	    assert lines[2] == '[End of matches for "a.txt" in ./]'


	def test_find_file_not_exist_file():
	    """``find_file`` without a directory prints 'No matches found ... in ./' for an unknown name."""
	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        find_file('nonexist.txt')
	        result = stream.getvalue()
	    assert result is not None

	    expected = '[No matches found for "nonexist.txt" in ./]\n'
	    assert result.split('\n') == expected.split('\n')


	def test_find_file_not_exist_file_specific_path(tmp_path):
	    """``find_file`` in an explicit directory prints 'No matches found' naming that directory."""
	    search_root = str(tmp_path)
	    with io.StringIO() as stream, contextlib.redirect_stdout(stream):
	        find_file('nonexist.txt', search_root)
	        result = stream.getvalue()
	    assert result is not None

	    expected = f'[No matches found for "nonexist.txt" in {tmp_path}]\n'
	    assert result.split('\n') == expected.split('\n')


	def test_parse_docx(tmp_path):
	    """``parse_docx`` prints a header line and each paragraph under its own page marker."""
	    # Create a DOCX file with two paragraphs.
	    test_docx_path = tmp_path / 'test.docx'
	    doc = docx.Document()
	    doc.add_paragraph('Hello, this is a test document.')
	    doc.add_paragraph('This is the second paragraph.')
	    doc.save(str(test_docx_path))

	    # redirect_stdout restores sys.stdout even if parse_docx raises; the
	    # previous manual swap left stdout hijacked for later tests on failure.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            parse_docx(str(test_docx_path))
	        output = buf.getvalue()

	    expected_output = (
	        f'[Reading DOCX file from {test_docx_path}]\n'
	        '@@ Page 1 @@\nHello, this is a test document.\n\n'
	        '@@ Page 2 @@\nThis is the second paragraph.\n\n\n'
	    )
	    assert output == expected_output, f'Expected output does not match. Got: {output}'


	def test_parse_latex(tmp_path):
	    """``parse_latex`` prints a header line followed by the document's text."""
	    # Create a LaTeX file with one sentence of body text.
	    test_latex_path = tmp_path / 'test.tex'
	    with open(test_latex_path, 'w') as f:
	        f.write(r"""
	\documentclass{article}
	\begin{document}
	Hello, this is a test LaTeX document.
	\end{document}
	""")

	    # redirect_stdout restores sys.stdout even if parse_latex raises; the
	    # previous manual swap left stdout hijacked for later tests on failure.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            parse_latex(str(test_latex_path))
	        output = buf.getvalue()

	    expected_output = (
	        f'[Reading LaTex file from {test_latex_path}]\n'
	        'Hello, this is a test LaTeX document.\n'
	    )
	    assert output == expected_output, f'Expected output does not match. Got: {output}'


	def test_parse_pdf(tmp_path):
	    """``parse_pdf`` prints a header line, a page marker and the page text."""
	    from reportlab.lib.pagesizes import letter
	    from reportlab.pdfgen import canvas

	    # Create a one-page PDF containing a single line of text.
	    test_pdf_path = tmp_path / 'test.pdf'
	    c = canvas.Canvas(str(test_pdf_path), pagesize=letter)
	    c.drawString(100, 750, 'Hello, this is a test PDF document.')
	    c.save()

	    # redirect_stdout restores sys.stdout even if parse_pdf raises; the
	    # previous manual swap left stdout hijacked for later tests on failure.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            parse_pdf(str(test_pdf_path))
	        output = buf.getvalue()

	    expected_output = (
	        f'[Reading PDF file from {test_pdf_path}]\n'
	        '@@ Page 1 @@\n'
	        'Hello, this is a test PDF document.\n'
	    )
	    assert output == expected_output, f'Expected output does not match. Got: {output}'


	def test_parse_pptx(tmp_path):
	    """``parse_pptx`` prints a header line and each slide's title under its own slide marker."""
	    from pptx import Presentation

	    # Create a two-slide presentation; each slide has only a title.
	    test_pptx_path = tmp_path / 'test.pptx'
	    pres = Presentation()

	    slide1 = pres.slides.add_slide(pres.slide_layouts[0])
	    slide1.shapes.title.text = 'Hello, this is the first test PPTX slide.'

	    slide2 = pres.slides.add_slide(pres.slide_layouts[0])
	    slide2.shapes.title.text = 'Hello, this is the second test PPTX slide.'

	    pres.save(str(test_pptx_path))

	    # redirect_stdout restores sys.stdout even if parse_pptx raises; the
	    # previous manual swap left stdout hijacked for later tests on failure.
	    with io.StringIO() as buf:
	        with contextlib.redirect_stdout(buf):
	            parse_pptx(str(test_pptx_path))
	        output = buf.getvalue()

	    expected_output = (
	        f'[Reading PowerPoint file from {test_pptx_path}]\n'
	        '@@ Slide 1 @@\n'
	        'Hello, this is the first test PPTX slide.\n\n'
	        '@@ Slide 2 @@\n'
	        'Hello, this is the second test PPTX slide.\n\n'
	    )
	    assert output == expected_output, f'Expected output does not match. Got: {output}'