"""Testing Agent Skill File Operations and Document Parsing in OpenHands

This test suite validates the agent skill functionality in OpenHands, focusing on file operations and document parsing capabilities. It includes comprehensive tests for file navigation, search operations, and multi-format document handling.

Test Coverage Overview
Implementation Analysis
Technical Details
Best Practices Demonstrated

Repository: all-hands-ai/openhands
File: tests/unit/test_agent_skill.py
"""
import contextlib
import io
import sys
import docx
import pytest
from openhands.runtime.plugins.agent_skills.file_ops.file_ops import (
WINDOW,
_print_window,
find_file,
goto_line,
open_file,
scroll_down,
scroll_up,
search_dir,
search_file,
)
from openhands.runtime.plugins.agent_skills.file_reader.file_readers import (
parse_docx,
parse_latex,
parse_pdf,
parse_pptx,
)
# CURRENT_FILE is a module-level attribute of agentskills, so it is reset for every test.
@pytest.fixture(autouse=True)
def reset_current_file():
    """Set ``agentskills.CURRENT_FILE`` to ``None`` before each test (autouse fixture)."""
    from openhands.runtime.plugins.agent_skills import agentskills as skills_module

    skills_module.CURRENT_FILE = None
def _numbered_test_lines(start, end) -> str:
    """Return the text ``'{i}|'`` for each ``i`` in ``start..end`` (inclusive).

    The prefixes are separated by newlines and the result always ends with a
    trailing newline, even when the range is empty.
    """
    prefixes = [f'{lineno}|' for lineno in range(start, end + 1)]
    joined = '\n'.join(prefixes)
    return f'{joined}\n'
def _generate_test_file_with_lines(temp_path, num_lines) -> str:
    """Create ``test_file.py`` under ``temp_path`` containing ``num_lines`` newlines.

    Returns the object produced by ``temp_path / 'test_file.py'`` (the path the
    content was written to).
    """
    target = temp_path / 'test_file.py'
    blank_content = '\n' * num_lines
    target.write_text(blank_content)
    return target
def _generate_ruby_test_file_with_lines(temp_path, num_lines) -> str:
    """Create ``test_file.rb`` under ``temp_path`` containing ``num_lines`` newlines.

    Returns the object produced by ``temp_path / 'test_file.rb'`` (the path the
    content was written to).
    """
    target = temp_path / 'test_file.rb'
    blank_content = '\n' * num_lines
    target.write_text(blank_content)
    return target
def _calculate_window_bounds(current_line, total_lines, window_size):
    """Calculate the bounds of the window around the current line.

    Args:
        current_line: 1-based line number the window is centred on.
        total_lines: Number of lines in the file; the end bound never exceeds it.
        window_size: Number of lines the window should span.

    Returns:
        A ``(start, end)`` tuple of 1-based, inclusive line numbers.
    """
    half_window = window_size // 2
    # Line numbers are 1-based, so a window that would start before line 1
    # (including exactly at 0) is pinned to the top of the file.
    if current_line - half_window < 1:
        start, end = 1, window_size
    else:
        start = current_line - half_window
        end = current_line + half_window
    # Never report lines past the end of the file.
    return start, min(end, total_lines)
def _capture_file_operation_error(operation, expected_error_msg):
    """Run ``operation`` with stdout captured and assert on what it printed.

    The captured text is stripped of surrounding whitespace before being
    compared with ``expected_error_msg``.
    """
    with io.StringIO() as sink:
        with contextlib.redirect_stdout(sink):
            operation()
        printed = sink.getvalue()
    assert printed.strip() == expected_error_msg
# Separator line: 49 dashes followed by a newline.
SEP = '{}\n'.format('-' * 49)
# =============================================================================
def test_open_file_unexist_path():
    """open_file on a missing path should print a 'not found' error."""
    missing_path = '/unexist/path/a.txt'

    def attempt_open():
        open_file(missing_path)

    _capture_file_operation_error(
        attempt_open,
        f'ERROR: File {missing_path} not found.',
    )
def test_open_file(tmp_path):
    """open_file on a 5-line file should print the whole file with markers."""
    assert tmp_path is not None
    sample = tmp_path / 'a.txt'
    sample.write_text('\n'.join(f'Line {n}' for n in range(1, 6)))

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(sample))
    printed = captured.getvalue()
    assert printed is not None

    expected_rows = [
        f'[File: {sample} (5 lines total)]',
        '(this is the beginning of the file)',
        *(f'{n}|Line {n}' for n in range(1, 6)),
        '(this is the end of the file)',
    ]
    expected = ''.join(f'{row}\n' for row in expected_rows)
    assert printed.split('\n') == expected.split('\n')
def test_open_file_with_indentation(tmp_path):
    """open_file should keep a line's leading whitespace in its output.

    The indented line is defined once and used both for the file content and
    for the expected output, so the two cannot drift apart.
    """
    indented_line = '    Line 2'
    temp_file_path = tmp_path / 'a.txt'
    temp_file_path.write_text(f'Line 1\n{indented_line}\nLine 3\nLine 4\nLine 5')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))
        result = buf.getvalue()
    assert result is not None

    expected = (
        f'[File: {temp_file_path} (5 lines total)]\n'
        '(this is the beginning of the file)\n'
        '1|Line 1\n'
        f'2|{indented_line}\n'
        '3|Line 3\n'
        '4|Line 4\n'
        '5|Line 5\n'
        '(this is the end of the file)\n'
    )
    assert result.split('\n') == expected.split('\n')
def test_open_file_long(tmp_path):
    """open_file(path, 1, 50) on a 1000-line file should print lines 1-50."""
    long_file = tmp_path / 'a.txt'
    long_file.write_text('\n'.join(f'Line {n}' for n in range(1, 1001)))

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(long_file), 1, 50)
    printed = captured.getvalue()
    assert printed is not None

    pieces = [
        f'[File: {long_file} (1000 lines total)]\n',
        '(this is the beginning of the file)\n',
    ]
    pieces.extend(f'{n}|Line {n}\n' for n in range(1, 51))
    pieces.append('(950 more lines below)\n')
    pieces.append('[Use `scroll_down` to view the next 100 lines of the file!]\n')
    expected = ''.join(pieces)
    assert printed.split('\n') == expected.split('\n')
def test_open_file_long_with_lineno(tmp_path):
    """open_file at line 100 of a 1000-line file should print the window around it."""
    long_file = tmp_path / 'a.txt'
    long_file.write_text('\n'.join(f'Line {n}' for n in range(1, 1001)))

    cur_line = 100
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(long_file), cur_line)
    printed = captured.getvalue()
    assert printed is not None

    # The expected window is derived from the helper rather than hard-coded.
    first, last = _calculate_window_bounds(cur_line, 1000, WINDOW)
    if first == 1:
        top_marker = '(this is the beginning of the file)\n'
    else:
        top_marker = f'({first - 1} more lines above)\n'
    if last == 1000:
        bottom_marker = '(this is the end of the file)\n'
    else:
        # The scroll hint only accompanies the "more lines below" marker.
        bottom_marker = (
            f'({1000 - last} more lines below)\n'
            '[Use `scroll_down` to view the next 100 lines of the file!]\n'
        )
    numbered = ''.join(f'{n}|Line {n}\n' for n in range(first, last + 1))
    expected = (
        f'[File: {long_file} (1000 lines total)]\n'
        + top_marker
        + numbered
        + bottom_marker
    )
    assert printed.split('\n') == expected.split('\n')
def test_goto_line(tmp_path):
    """Open a 1000-line file, then goto_line(500), checking both printed windows."""
    total_lines = 1000
    target = tmp_path / 'a.txt'
    target.write_text('\n'.join(f'Line {n}' for n in range(1, total_lines + 1)))
    header = f'[File: {target} ({total_lines} lines total)]\n'

    # Initial view: the first WINDOW lines followed by the scroll hint.
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(target))
    printed = captured.getvalue()
    assert printed is not None
    expected = ''.join(
        [
            header,
            '(this is the beginning of the file)\n',
            *(f'{n}|Line {n}\n' for n in range(1, WINDOW + 1)),
            f'({total_lines - WINDOW} more lines below)\n',
            '[Use `scroll_down` to view the next 100 lines of the file!]\n',
        ]
    )
    assert printed.split('\n') == expected.split('\n')

    # Jump to line 500 and compare against the window computed by the helper.
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        goto_line(500)
    printed = captured.getvalue()
    assert printed is not None

    cur_line = 500
    first, last = _calculate_window_bounds(cur_line, total_lines, WINDOW)
    if first == 1:
        top_marker = '(this is the beginning of the file)\n'
    else:
        top_marker = f'({first - 1} more lines above)\n'
    if last == total_lines:
        bottom_marker = '(this is the end of the file)\n'
    else:
        bottom_marker = f'({total_lines - last} more lines below)\n'
    numbered = ''.join(f'{n}|Line {n}\n' for n in range(first, last + 1))
    expected = header + top_marker + numbered + bottom_marker
    assert printed.split('\n') == expected.split('\n')
def test_goto_line_negative(tmp_path):
    """goto_line(-1) on a 4-line file should print the range error."""
    four_line_file = tmp_path / 'a.txt'
    four_line_file.write_text('\n'.join(f'Line {n}' for n in range(1, 5)))

    # Open the file first; its output is captured and discarded.
    with contextlib.redirect_stdout(io.StringIO()):
        open_file(str(four_line_file))

    def jump_to_negative_line():
        goto_line(-1)

    _capture_file_operation_error(
        jump_to_negative_line, 'ERROR: Line number must be between 1 and 4.'
    )
def test_goto_line_out_of_bound(tmp_path):
    """goto_line(100) on a 9-line file should print the range error."""
    nine_line_file = tmp_path / 'a.txt'
    nine_line_file.write_text('\n'.join(f'Line {n}' for n in range(1, 10)))

    # Open the file first; its output is captured and discarded.
    with contextlib.redirect_stdout(io.StringIO()):
        open_file(str(nine_line_file))

    def jump_past_end():
        goto_line(100)

    _capture_file_operation_error(
        jump_past_end, 'ERROR: Line number must be between 1 and 9.'
    )
def test_scroll_down(tmp_path):
    """Check the window printed by open_file and then by scroll_down (1000 lines)."""
    total_lines = 1000
    target = tmp_path / 'a.txt'
    target.write_text('\n'.join(f'Line {n}' for n in range(1, total_lines + 1)))
    header = f'[File: {target} ({total_lines} lines total)]\n'

    # --- initial open -------------------------------------------------------
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(target))
    printed = captured.getvalue()
    assert printed is not None

    first, last = _calculate_window_bounds(1, total_lines, WINDOW)
    if first == 1:
        top_marker = '(this is the beginning of the file)\n'
    else:
        top_marker = f'({first - 1} more lines above)\n'
    if last == total_lines:
        bottom_marker = '(this is the end of the file)\n'
    else:
        # The scroll hint only accompanies the "more lines below" marker.
        bottom_marker = (
            f'({total_lines - last} more lines below)\n'
            '[Use `scroll_down` to view the next 100 lines of the file!]\n'
        )
    numbered = ''.join(f'{n}|Line {n}\n' for n in range(first, last + 1))
    expected = header + top_marker + numbered + bottom_marker
    assert printed.split('\n') == expected.split('\n')

    # --- after one scroll_down ----------------------------------------------
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        scroll_down()
    printed = captured.getvalue()
    assert printed is not None

    first = WINDOW + 1
    last = 2 * WINDOW + 1
    if first == 1:
        top_marker = '(this is the beginning of the file)\n'
    else:
        top_marker = f'({first - 1} more lines above)\n'
    if last == total_lines:
        bottom_marker = '(this is the end of the file)\n'
    else:
        bottom_marker = f'({total_lines - last} more lines below)\n'
    numbered = ''.join(f'{n}|Line {n}\n' for n in range(first, last + 1))
    expected = header + top_marker + numbered + bottom_marker
    assert printed.split('\n') == expected.split('\n')
def test_scroll_up(tmp_path):
    """Open a 1000-line file at line 300, scroll_up once, and check both windows."""
    total_lines = 1000
    target = tmp_path / 'a.txt'
    target.write_text('\n'.join(f'Line {n}' for n in range(1, total_lines + 1)))
    header = f'[File: {target} ({total_lines} lines total)]\n'

    # --- initial open at line 300 -------------------------------------------
    cur_line = 300
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(target), cur_line)
    printed = captured.getvalue()
    assert printed is not None

    first, last = _calculate_window_bounds(cur_line, total_lines, WINDOW)
    if first == 1:
        top_marker = '(this is the beginning of the file)\n'
    else:
        top_marker = f'({first - 1} more lines above)\n'
    if last == total_lines:
        bottom_marker = '(this is the end of the file)\n'
    else:
        # The scroll hint only accompanies the "more lines below" marker.
        bottom_marker = (
            f'({total_lines - last} more lines below)\n'
            '[Use `scroll_down` to view the next 100 lines of the file!]\n'
        )
    numbered = ''.join(f'{n}|Line {n}\n' for n in range(first, last + 1))
    expected = header + top_marker + numbered + bottom_marker
    assert printed.split('\n') == expected.split('\n')

    # --- after one scroll_up ------------------------------------------------
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        scroll_up()
    printed = captured.getvalue()
    assert printed is not None

    cur_line -= WINDOW
    first = cur_line
    last = cur_line + WINDOW
    if first == 1:
        top_marker = '(this is the beginning of the file)\n'
    else:
        top_marker = f'({first - 1} more lines above)\n'
    if last == total_lines:
        bottom_marker = '(this is the end of the file)\n'
    else:
        bottom_marker = f'({total_lines - last} more lines below)\n'
    numbered = ''.join(f'{n}|Line {n}\n' for n in range(first, last + 1))
    expected = header + top_marker + numbered + bottom_marker
    assert printed.split('\n') == expected.split('\n')
def test_scroll_down_edge(tmp_path):
    """scroll_down on a 9-line file should print the same full-file view."""
    small_file = tmp_path / 'a.txt'
    small_file.write_text('\n'.join(f'Line {n}' for n in range(1, 10)))

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(small_file))
    printed = captured.getvalue()
    assert printed is not None

    expected = ''.join(
        [
            f'[File: {small_file} (9 lines total)]\n',
            '(this is the beginning of the file)\n',
            *(f'{n}|Line {n}\n' for n in range(1, 10)),
            '(this is the end of the file)\n',
        ]
    )

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        scroll_down()
    printed = captured.getvalue()
    assert printed is not None

    # The view after scrolling is compared with the same expected text.
    assert printed.split('\n') == expected.split('\n')
def test_print_window_internal(tmp_path):
    """_print_window should print lines 49-51 around line 50, backticks intact."""
    test_file_path = tmp_path / 'a.txt'
    test_file_path.write_text('')
    open_file(str(test_file_path))

    # Fill the file with 100 lines whose text contains backticks.
    with open(test_file_path, 'w') as handle:
        handle.writelines(f'Line `{n}`\n' for n in range(1, 101))

    current_line, window = 50, 2
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        _print_window(str(test_file_path), current_line, window, return_str=False)
    printed = captured.getvalue()

    expected = ''.join(
        [
            '(48 more lines above)\n',
            '49|Line `49`\n',
            '50|Line `50`\n',
            '51|Line `51`\n',
            '(49 more lines below)\n',
        ]
    )
    assert printed == expected
def test_open_file_large_line_number(tmp_path):
    """open_file(path, 800, 100) on a 999-line file should print lines 750-850."""
    test_file_path = tmp_path / 'a.txt'
    test_file_path.write_text('')
    open_file(str(test_file_path))

    # Fill the file with 999 lines whose text contains backticks.
    with open(test_file_path, 'w') as handle:
        handle.writelines(f'Line `{n}`\n' for n in range(1, 1000))

    current_line, window = 800, 100
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        open_file(str(test_file_path), current_line, window)
    printed = captured.getvalue()

    pieces = [
        f'[File: {test_file_path} (999 lines total)]\n',
        '(749 more lines above)\n',
    ]
    pieces.extend(f'{n}|Line `{n}`\n' for n in range(750, 850 + 1))
    pieces.append('(149 more lines below)\n')
    pieces.append('[Use `scroll_down` to view the next 100 lines of the file!]\n')
    expected = ''.join(pieces)
    assert printed == expected
def test_search_dir(tmp_path):
    """search_dir should report the single file (a50.txt) that contains 'bingo'."""
    common_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
    # 100 files share the same five lines; only a50.txt also gets "bingo".
    for idx in range(1, 101):
        with open(tmp_path / f'a{idx}.txt', 'w') as handle:
            handle.write(common_text)
            if idx == 50:
                handle.write('bingo')

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        search_dir('bingo', str(tmp_path))
    printed = captured.getvalue()
    assert printed is not None

    expected = ''.join(
        [
            f'[Found 1 matches for "bingo" in {tmp_path}]\n',
            f'{tmp_path}/a50.txt (Line 6): bingo\n',
            f'[End of matches for "bingo" in {tmp_path}]\n',
        ]
    )
    assert printed.split('\n') == expected.split('\n')
def test_search_dir_not_exist_term(tmp_path):
    """search_dir should print 'No matches found' when no file contains the term."""
    common_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
    # 100 files, none of which contains the search term.
    for idx in range(1, 101):
        with open(tmp_path / f'a{idx}.txt', 'w') as handle:
            handle.write(common_text)

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        search_dir('non-exist', str(tmp_path))
    printed = captured.getvalue()
    assert printed is not None

    expected = f'No matches found for "non-exist" in {tmp_path}\n'
    assert printed.split('\n') == expected.split('\n')
def test_search_dir_too_much_match(tmp_path):
    """search_dir should ask to narrow the search when 999 files match."""
    common_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
    # 999 files, every one of which contains "Line 5".
    for idx in range(1, 1000):
        with open(tmp_path / f'a{idx}.txt', 'w') as handle:
            handle.write(common_text)

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        search_dir('Line 5', str(tmp_path))
    printed = captured.getvalue()
    assert printed is not None

    expected = f'More than 999 files matched for "Line 5" in {tmp_path}. Please narrow your search.\n'
    assert printed.split('\n') == expected.split('\n')
def test_search_dir_cwd(tmp_path, monkeypatch):
    """search_dir without a directory argument should report matches under './'."""
    # monkeypatch restores the working directory after the test.
    monkeypatch.chdir(tmp_path)

    common_text = 'Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n'
    # 100 files share the same five lines; only a50.txt also gets "bingo".
    for idx in range(1, 101):
        with open(tmp_path / f'a{idx}.txt', 'w') as handle:
            handle.write(common_text)
            if idx == 50:
                handle.write('bingo')

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        search_dir('bingo')
    printed = captured.getvalue()
    assert printed is not None

    expected = ''.join(
        [
            '[Found 1 matches for "bingo" in ./]\n',
            './a50.txt (Line 6): bingo\n',
            '[End of matches for "bingo" in ./]\n',
        ]
    )
    assert printed.split('\n') == expected.split('\n')
def test_search_file(tmp_path):
    """search_file should report the one line matching 'Line 5'."""
    sample = tmp_path / 'a.txt'
    sample.write_text('\n'.join(f'Line {n}' for n in range(1, 6)))

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        search_file('Line 5', str(sample))
    printed = captured.getvalue()
    assert printed is not None

    expected = ''.join(
        [
            f'[Found 1 matches for "Line 5" in {sample}]\n',
            'Line 5: Line 5\n',
            f'[End of matches for "Line 5" in {sample}]\n',
        ]
    )
    assert printed.split('\n') == expected.split('\n')
def test_search_file_not_exist_term(tmp_path):
    """search_file should print 'No matches found' for a term absent from the file."""
    sample = tmp_path / 'a.txt'
    sample.write_text('\n'.join(f'Line {n}' for n in range(1, 6)))

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        search_file('Line 6', str(sample))
    printed = captured.getvalue()
    assert printed is not None

    expected = f'[No matches found for "Line 6" in {sample}]\n'
    assert printed.split('\n') == expected.split('\n')
def test_search_file_not_exist_file():
    """search_file on a missing path should print a 'not found' error."""
    missing_path = '/unexist/path/a.txt'

    def attempt_search():
        search_file('Line 6', missing_path)

    _capture_file_operation_error(
        attempt_search,
        f'ERROR: File {missing_path} not found.',
    )
def test_find_file(tmp_path):
    """find_file should list a.txt when searching in tmp_path."""
    sample = tmp_path / 'a.txt'
    sample.write_text('\n'.join(f'Line {n}' for n in range(1, 6)))

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        find_file('a.txt', str(tmp_path))
    printed = captured.getvalue()
    assert printed is not None

    expected = ''.join(
        [
            f'[Found 1 matches for "a.txt" in {tmp_path}]\n',
            f'{tmp_path}/a.txt\n',
            f'[End of matches for "a.txt" in {tmp_path}]\n',
        ]
    )
    assert printed.split('\n') == expected.split('\n')
def test_find_file_cwd(tmp_path, monkeypatch):
    """find_file without a directory argument should run and produce output.

    Only checks that the captured output is not ``None``; the exact text is
    not asserted here.
    """
    monkeypatch.chdir(tmp_path)
    sample = tmp_path / 'a.txt'
    sample.write_text('\n'.join(f'Line {n}' for n in range(1, 6)))

    with contextlib.redirect_stdout(io.StringIO()) as captured:
        find_file('a.txt')
    printed = captured.getvalue()
    assert printed is not None
def test_find_file_not_exist_file():
    """find_file for a name that does not exist should report no matches in './'."""
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        find_file('nonexist.txt')
    printed = captured.getvalue()
    assert printed is not None

    expected = '[No matches found for "nonexist.txt" in ./]\n'
    assert printed.split('\n') == expected.split('\n')
def test_find_file_not_exist_file_specific_path(tmp_path):
    """find_file in an empty tmp_path should report no matches for that path."""
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        find_file('nonexist.txt', str(tmp_path))
    printed = captured.getvalue()
    assert printed is not None

    expected = f'[No matches found for "nonexist.txt" in {tmp_path}]\n'
    assert printed.split('\n') == expected.split('\n')
def test_parse_docx(tmp_path):
    """parse_docx should print each paragraph of a DOCX file under a page marker."""
    # Create a DOCX file with two paragraphs
    test_docx_path = tmp_path / 'test.docx'
    doc = docx.Document()
    doc.add_paragraph('Hello, this is a test document.')
    doc.add_paragraph('This is the second paragraph.')
    doc.save(str(test_docx_path))

    # redirect_stdout restores sys.stdout even if parse_docx raises, so a
    # failure here cannot leave stdout redirected for later tests.
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        parse_docx(str(test_docx_path))
    output = captured.getvalue()

    expected_output = (
        f'[Reading DOCX file from {test_docx_path}]\n'
        '@@ Page 1 @@\nHello, this is a test document.\n'
        '@@ Page 2 @@\nThis is the second paragraph.\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'
def test_parse_latex(tmp_path):
    """parse_latex should print the text content of a minimal LaTeX document."""
    # Create a LaTeX file; the content starts and ends with a newline.
    test_latex_path = tmp_path / 'test.tex'
    latex_source = '\n'.join(
        [
            '',
            r'\documentclass{article}',
            r'\begin{document}',
            'Hello, this is a test LaTeX document.',
            r'\end{document}',
            '',
        ]
    )
    with open(test_latex_path, 'w') as f:
        f.write(latex_source)

    # redirect_stdout restores sys.stdout even if parse_latex raises, so a
    # failure here cannot leave stdout redirected for later tests.
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        parse_latex(str(test_latex_path))
    output = captured.getvalue()

    expected_output = (
        f'[Reading LaTex file from {test_latex_path}]\n'
        'Hello, this is a test LaTeX document.\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'
def test_parse_pdf(tmp_path):
    """parse_pdf should print the text of a one-page PDF under a page marker."""
    # Create a PDF file with a single line of text
    test_pdf_path = tmp_path / 'test.pdf'
    from reportlab.lib.pagesizes import letter
    from reportlab.pdfgen import canvas

    c = canvas.Canvas(str(test_pdf_path), pagesize=letter)
    c.drawString(100, 750, 'Hello, this is a test PDF document.')
    c.save()

    # redirect_stdout restores sys.stdout even if parse_pdf raises, so a
    # failure here cannot leave stdout redirected for later tests.
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        parse_pdf(str(test_pdf_path))
    output = captured.getvalue()

    expected_output = (
        f'[Reading PDF file from {test_pdf_path}]\n'
        '@@ Page 1 @@\n'
        'Hello, this is a test PDF document.\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'
def test_parse_pptx(tmp_path):
    """parse_pptx should print each slide's title text under a slide marker."""
    # Create a two-slide presentation with a title on each slide
    test_pptx_path = tmp_path / 'test.pptx'
    from pptx import Presentation

    pres = Presentation()

    slide1 = pres.slides.add_slide(pres.slide_layouts[0])
    title1 = slide1.shapes.title
    title1.text = 'Hello, this is the first test PPTX slide.'

    slide2 = pres.slides.add_slide(pres.slide_layouts[0])
    title2 = slide2.shapes.title
    title2.text = 'Hello, this is the second test PPTX slide.'

    pres.save(str(test_pptx_path))

    # redirect_stdout restores sys.stdout even if parse_pptx raises, so a
    # failure here cannot leave stdout redirected for later tests.
    with contextlib.redirect_stdout(io.StringIO()) as captured:
        parse_pptx(str(test_pptx_path))
    output = captured.getvalue()

    expected_output = (
        f'[Reading PowerPoint file from {test_pptx_path}]\n'
        '@@ Slide 1 @@\n'
        'Hello, this is the first test PPTX slide.\n'
        '@@ Slide 2 @@\n'
        'Hello, this is the second test PPTX slide.\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'