Back to Repositories

Testing Agent Skill File Operations and Document Parsing in OpenHands

This test suite validates the agent skill functionality in OpenHands, focusing on file operations and document parsing capabilities. It includes comprehensive tests for file navigation, search operations, and multi-format document handling.

Test Coverage Overview

The test suite provides extensive coverage of file operation skills including:
  • File opening and navigation (goto_line, scroll_up/down)
  • File searching and content matching
  • Document parsing for multiple formats (PDF, DOCX, LaTeX, PPTX)
  • Edge case handling for file operations
Integration points include file system operations, document processing libraries, and I/O handling.

Implementation Analysis

The testing approach uses pytest fixtures and context managers to isolate tests and capture output.
Key patterns include:
  • Temporary file/directory creation for safe testing
  • Output redirection and validation
  • Expected output built programmatically by shared helper functions
  • Working-directory changes isolated with monkeypatch.chdir
The suite makes extensive use of pytest’s tmp_path and monkeypatch fixtures.

Technical Details

Testing tools and configuration:
  • pytest framework with fixtures
  • contextlib for I/O redirection
  • Document processing libraries (docx, reportlab, pptx)
  • StringIO for output capture
  • Temporary file system management

Best Practices Demonstrated

The test suite exemplifies testing best practices through isolated test cases, comprehensive assertions, and proper resource cleanup.
  • Fixture usage for test setup/teardown
  • Proper error case validation
  • Modular test organization
  • Descriptive test naming
  • Thorough edge case coverage

all-hands-ai/openhands

tests/unit/test_agent_skill.py

            
import contextlib
import io
import sys

import docx
import pytest

from openhands.runtime.plugins.agent_skills.file_ops.file_ops import (
    WINDOW,
    _print_window,
    find_file,
    goto_line,
    open_file,
    scroll_down,
    scroll_up,
    search_dir,
    search_file,
)
from openhands.runtime.plugins.agent_skills.file_reader.file_readers import (
    parse_docx,
    parse_latex,
    parse_pdf,
    parse_pptx,
)


# CURRENT_FILE must be reset for each test
@pytest.fixture(autouse=True)
def reset_current_file() -> None:
    """Set ``agentskills.CURRENT_FILE`` to ``None`` before each test.

    Declared ``autouse`` so it applies to every test in this module without
    being requested explicitly.
    """
    # Imported inside the fixture rather than at module import time.
    from openhands.runtime.plugins.agent_skills import agentskills

    agentskills.CURRENT_FILE = None


def _numbered_test_lines(start, end) -> str:
    """Return the numbered listing of empty lines ``start``..``end`` (inclusive).

    Each line is rendered as ``'<n>|'`` and every line, including the last,
    is followed by a newline. The trailing newline is appended
    unconditionally, so an empty range yields ``'\\n'``.
    """
    return ('\n'.join(f'{i}|' for i in range(start, end + 1))) + '\n'


def _generate_test_file_with_lines(temp_path, num_lines) -> str:
    """Create ``test_file.py`` under ``temp_path`` containing ``num_lines`` newlines.

    Args:
        temp_path: Directory object supporting the ``/`` operator (e.g. a
            ``pathlib.Path``).
        num_lines: Number of newline characters written to the file.

    Returns:
        The object produced by ``temp_path / 'test_file.py'``.
        NOTE(review): the signature is annotated ``-> str``, but for a
        ``pathlib.Path`` argument the result is a ``Path``; wrap the result in
        ``str()`` where a plain string is required.
    """
    file_path = temp_path / 'test_file.py'
    file_path.write_text('\n' * num_lines)
    return file_path


def _generate_ruby_test_file_with_lines(temp_path, num_lines) -> str:
    """Create ``test_file.rb`` under ``temp_path`` containing ``num_lines`` newlines.

    Args:
        temp_path: Directory object supporting the ``/`` operator (e.g. a
            ``pathlib.Path``).
        num_lines: Number of newline characters written to the file.

    Returns:
        The object produced by ``temp_path / 'test_file.rb'``.
        NOTE(review): the signature is annotated ``-> str``, but for a
        ``pathlib.Path`` argument the result is a ``Path``; wrap the result in
        ``str()`` where a plain string is required.
    """
    file_path = temp_path / 'test_file.rb'
    file_path.write_text('\n' * num_lines)
    return file_path


def _calculate_window_bounds(current_line, total_lines, window_size):
    """Return the ``(start, end)`` line numbers of the view around ``current_line``.

    The view extends ``window_size // 2`` lines on either side of
    ``current_line``. Only when that would put the start below zero is the
    view pinned to ``(1, window_size)``; a computed start of exactly ``0`` is
    returned as-is. ``total_lines`` is accepted but not used, so ``end`` is
    never clamped to the file length.
    """
    radius = window_size // 2
    first = current_line - radius
    if first >= 0:
        return first, current_line + radius
    # Too close to the top of the file: show the first full window instead.
    return 1, window_size


def _capture_file_operation_error(operation, expected_error_msg):
    """Run ``operation`` and assert what it printed equals ``expected_error_msg``.

    Standard output is redirected into an in-memory buffer while the
    zero-argument callable ``operation`` runs; the captured text is stripped of
    surrounding whitespace before being compared.
    """
    with contextlib.redirect_stdout(io.StringIO()) as sink:
        operation()
    printed = sink.getvalue().strip()
    assert printed == expected_error_msg


# Separator line: 49 dashes followed by a newline.
SEP = '-' * 49 + '\n'


# =============================================================================


def test_open_file_unexist_path():
    """open_file on a path that does not exist prints a not-found error."""
    expected_message = 'ERROR: File /unexist/path/a.txt not found.'

    def open_missing_file():
        open_file('/unexist/path/a.txt')

    _capture_file_operation_error(open_missing_file, expected_message)


def test_open_file(tmp_path):
    """open_file prints a short file in full between begin/end markers."""
    temp_file_path = tmp_path / 'a.txt'
    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))
        result = buf.getvalue()

    expected = (
        f'[File: {temp_file_path} (5 lines total)]\n'
        '(this is the beginning of the file)\n'
        '1|Line 1\n'
        '2|Line 2\n'
        '3|Line 3\n'
        '4|Line 4\n'
        '5|Line 5\n'
        '(this is the end of the file)\n'
    )
    assert result.split('\n') == expected.split('\n')


def test_open_file_with_indentation(tmp_path):
    """open_file preserves leading whitespace of the lines it prints."""
    temp_file_path = tmp_path / 'a.txt'
    temp_file_path.write_text('Line 1\n    Line 2\nLine 3\nLine 4\nLine 5')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))
        result = buf.getvalue()

    expected = (
        f'[File: {temp_file_path} (5 lines total)]\n'
        '(this is the beginning of the file)\n'
        '1|Line 1\n'
        '2|    Line 2\n'
        '3|Line 3\n'
        '4|Line 4\n'
        '5|Line 5\n'
        '(this is the end of the file)\n'
    )
    assert result.split('\n') == expected.split('\n')


def test_open_file_long(tmp_path):
    """open_file(path, 1, 50) shows the first 50 of 1000 lines plus a scroll hint."""
    temp_file_path = tmp_path / 'a.txt'
    content = '\n'.join([f'Line {i}' for i in range(1, 1001)])
    temp_file_path.write_text(content)

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path), 1, 50)
        result = buf.getvalue()

    expected = f'[File: {temp_file_path} (1000 lines total)]\n'
    expected += '(this is the beginning of the file)\n'
    for i in range(1, 51):
        expected += f'{i}|Line {i}\n'
    expected += '(950 more lines below)\n'
    expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
    assert result.split('\n') == expected.split('\n')


def test_open_file_long_with_lineno(tmp_path):
    """open_file(path, line) shows a WINDOW-sized view around the given line."""
    temp_file_path = tmp_path / 'a.txt'
    content = '\n'.join([f'Line {i}' for i in range(1, 1001)])
    temp_file_path.write_text(content)

    cur_line = 100

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path), cur_line)
        result = buf.getvalue()

    expected = f'[File: {temp_file_path} (1000 lines total)]\n'
    # The expected view spans WINDOW // 2 lines on each side of cur_line; it
    # only falls back to lines 1..WINDOW when cur_line - WINDOW // 2 < 0.
    # NOTE(review): the hint below hard-codes "100 lines", so this presumably
    # relies on WINDOW == 100 - confirm against file_ops.
    start, end = _calculate_window_bounds(cur_line, 1000, WINDOW)
    if start == 1:
        expected += '(this is the beginning of the file)\n'
    else:
        expected += f'({start - 1} more lines above)\n'
    for i in range(start, end + 1):
        expected += f'{i}|Line {i}\n'
    if end == 1000:
        expected += '(this is the end of the file)\n'
    else:
        expected += f'({1000 - end} more lines below)\n'
        expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
    assert result.split('\n') == expected.split('\n')


def test_goto_line(tmp_path):
    """goto_line re-renders the currently opened file around the requested line."""
    temp_file_path = tmp_path / 'a.txt'
    total_lines = 1000
    content = '\n'.join([f'Line {i}' for i in range(1, total_lines + 1)])
    temp_file_path.write_text(content)

    # Step 1: opening the file shows the first WINDOW lines.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))
        result = buf.getvalue()

    expected = f'[File: {temp_file_path} ({total_lines} lines total)]\n'
    expected += '(this is the beginning of the file)\n'
    for i in range(1, WINDOW + 1):
        expected += f'{i}|Line {i}\n'
    expected += f'({total_lines - WINDOW} more lines below)\n'
    expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
    assert result.split('\n') == expected.split('\n')

    # Step 2: jumping to line 500 shows the window around that line.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            goto_line(500)
        result = buf.getvalue()

    cur_line = 500
    expected = f'[File: {temp_file_path} ({total_lines} lines total)]\n'
    start, end = _calculate_window_bounds(cur_line, total_lines, WINDOW)
    if start == 1:
        expected += '(this is the beginning of the file)\n'
    else:
        expected += f'({start - 1} more lines above)\n'
    for i in range(start, end + 1):
        expected += f'{i}|Line {i}\n'
    if end == total_lines:
        expected += '(this is the end of the file)\n'
    else:
        expected += f'({total_lines - end} more lines below)\n'
    assert result.split('\n') == expected.split('\n')


def test_goto_line_negative(tmp_path):
    """goto_line rejects a negative line number with a range error."""
    temp_file_path = tmp_path / 'a.txt'
    # range(1, 5) produces a four-line file, matching the "1 and 4" in the error.
    content = '\n'.join([f'Line {i}' for i in range(1, 5)])
    temp_file_path.write_text(content)

    # Open the file first; its output is captured only to keep stdout quiet.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))

    _capture_file_operation_error(
        lambda: goto_line(-1), 'ERROR: Line number must be between 1 and 4.'
    )


def test_goto_line_out_of_bound(tmp_path):
    """goto_line rejects a line number past the end of the file."""
    temp_file_path = tmp_path / 'a.txt'
    # range(1, 10) produces a nine-line file, matching the "1 and 9" in the error.
    content = '\n'.join([f'Line {i}' for i in range(1, 10)])
    temp_file_path.write_text(content)

    # Open the file first; its output is captured only to keep stdout quiet.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))

    _capture_file_operation_error(
        lambda: goto_line(100), 'ERROR: Line number must be between 1 and 9.'
    )


def test_scroll_down(tmp_path):
    """scroll_down advances the view of the opened file by one window."""
    temp_file_path = tmp_path / 'a.txt'
    total_lines = 1000
    content = '\n'.join([f'Line {i}' for i in range(1, total_lines + 1)])
    temp_file_path.write_text(content)

    # Step 1: the initial view after opening the file.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))
        result = buf.getvalue()

    expected = f'[File: {temp_file_path} ({total_lines} lines total)]\n'
    start, end = _calculate_window_bounds(1, total_lines, WINDOW)
    if start == 1:
        expected += '(this is the beginning of the file)\n'
    else:
        expected += f'({start - 1} more lines above)\n'
    for i in range(start, end + 1):
        expected += f'{i}|Line {i}\n'
    if end == total_lines:
        expected += '(this is the end of the file)\n'
    else:
        expected += f'({total_lines - end} more lines below)\n'
        expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
    assert result.split('\n') == expected.split('\n')

    # Step 2: the view after scrolling down once.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            scroll_down()
        result = buf.getvalue()

    expected = f'[File: {temp_file_path} ({total_lines} lines total)]\n'
    start = WINDOW + 1
    end = 2 * WINDOW + 1
    if start == 1:
        expected += '(this is the beginning of the file)\n'
    else:
        expected += f'({start - 1} more lines above)\n'
    for i in range(start, end + 1):
        expected += f'{i}|Line {i}\n'
    if end == total_lines:
        expected += '(this is the end of the file)\n'
    else:
        expected += f'({total_lines - end} more lines below)\n'
    assert result.split('\n') == expected.split('\n')


def test_scroll_up(tmp_path):
    """scroll_up moves the view of the opened file back by one window."""
    temp_file_path = tmp_path / 'a.txt'
    total_lines = 1000
    content = '\n'.join([f'Line {i}' for i in range(1, total_lines + 1)])
    temp_file_path.write_text(content)

    # Step 1: open the file around line 300.
    cur_line = 300
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path), cur_line)
        result = buf.getvalue()

    expected = f'[File: {temp_file_path} ({total_lines} lines total)]\n'
    start, end = _calculate_window_bounds(cur_line, total_lines, WINDOW)
    if start == 1:
        expected += '(this is the beginning of the file)\n'
    else:
        expected += f'({start - 1} more lines above)\n'
    for i in range(start, end + 1):
        expected += f'{i}|Line {i}\n'
    if end == total_lines:
        expected += '(this is the end of the file)\n'
    else:
        expected += f'({total_lines - end} more lines below)\n'
        expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
    assert result.split('\n') == expected.split('\n')

    # Step 2: the view after scrolling up once.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            scroll_up()
        result = buf.getvalue()

    cur_line = cur_line - WINDOW

    expected = f'[File: {temp_file_path} ({total_lines} lines total)]\n'
    start = cur_line
    end = cur_line + WINDOW

    if start == 1:
        expected += '(this is the beginning of the file)\n'
    else:
        expected += f'({start - 1} more lines above)\n'
    for i in range(start, end + 1):
        expected += f'{i}|Line {i}\n'
    if end == total_lines:
        expected += '(this is the end of the file)\n'
    else:
        expected += f'({total_lines - end} more lines below)\n'
    assert result.split('\n') == expected.split('\n')


def test_scroll_down_edge(tmp_path):
    """scroll_down on a file that fits in one view leaves the view unchanged."""
    temp_file_path = tmp_path / 'a.txt'
    content = '\n'.join([f'Line {i}' for i in range(1, 10)])
    temp_file_path.write_text(content)

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(temp_file_path))
        result = buf.getvalue()

    expected = f'[File: {temp_file_path} (9 lines total)]\n'
    expected += '(this is the beginning of the file)\n'
    for i in range(1, 10):
        expected += f'{i}|Line {i}\n'
    expected += '(this is the end of the file)\n'
    # Check the initial view too, so a scroll_down failure below is not
    # confused with a rendering problem in open_file itself.
    assert result.split('\n') == expected.split('\n')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            scroll_down()
        result = buf.getvalue()

    # expected should be unchanged
    assert result.split('\n') == expected.split('\n')


def test_print_window_internal(tmp_path):
    """_print_window renders lines containing backticks verbatim."""
    test_file_path = tmp_path / 'a.txt'
    test_file_path.write_text('')
    # The file is opened while still empty and only then filled with content.
    open_file(str(test_file_path))
    with open(test_file_path, 'w') as file:
        for i in range(1, 101):
            file.write(f'Line `{i}`\n')

    # Define the parameters for the test
    current_line = 50
    window = 2

    # Test _print_window especially with backticks
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            _print_window(str(test_file_path), current_line, window, return_str=False)
        result = buf.getvalue()

    expected = (
        '(48 more lines above)\n'
        '49|Line `49`\n'
        '50|Line `50`\n'
        '51|Line `51`\n'
        '(49 more lines below)\n'
    )
    assert result == expected


def test_open_file_large_line_number(tmp_path):
    """open_file with an explicit line and context size deep inside a long file."""
    test_file_path = tmp_path / 'a.txt'
    test_file_path.write_text('')
    # The file is opened while still empty and only then filled with content.
    open_file(str(test_file_path))
    with open(test_file_path, 'w') as file:
        for i in range(1, 1000):
            file.write(f'Line `{i}`\n')

    # Define the parameters for the test
    current_line = 800
    window = 100

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            open_file(str(test_file_path), current_line, window)
        result = buf.getvalue()

    expected = f'[File: {test_file_path} (999 lines total)]\n'
    expected += '(749 more lines above)\n'
    for i in range(750, 850 + 1):
        expected += f'{i}|Line `{i}`\n'
    expected += '(149 more lines below)\n'
    expected += '[Use `scroll_down` to view the next 100 lines of the file!]\n'
    assert result == expected


def test_search_dir(tmp_path):
    """search_dir reports the single file and line that contain the term."""
    # Create 100 files; only a50.txt gets the search term "bingo" (on line 6).
    for i in range(1, 101):
        temp_file_path = tmp_path / f'a{i}.txt'
        with open(temp_file_path, 'w') as file:
            file.write('Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n')
            if i == 50:
                file.write('bingo')

    # test
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            search_dir('bingo', str(tmp_path))
        result = buf.getvalue()

    expected = (
        f'[Found 1 matches for "bingo" in {tmp_path}]\n'
        f'{tmp_path}/a50.txt (Line 6): bingo\n'
        f'[End of matches for "bingo" in {tmp_path}]\n'
    )
    assert result.split('\n') == expected.split('\n')


def test_search_dir_not_exist_term(tmp_path):
    """search_dir reports no matches when no file contains the term."""
    # Create 100 files, none of which contains the search term.
    for i in range(1, 101):
        temp_file_path = tmp_path / f'a{i}.txt'
        with open(temp_file_path, 'w') as file:
            file.write('Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n')

    # test
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            search_dir('non-exist', str(tmp_path))
        result = buf.getvalue()

    expected = f'No matches found for "non-exist" in {tmp_path}\n'
    assert result.split('\n') == expected.split('\n')


def test_search_dir_too_much_match(tmp_path):
    """search_dir asks the caller to narrow the search when too many files match."""
    # Create 999 files that all contain the search term "Line 5".
    for i in range(1, 1000):
        temp_file_path = tmp_path / f'a{i}.txt'
        with open(temp_file_path, 'w') as file:
            file.write('Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            search_dir('Line 5', str(tmp_path))
        result = buf.getvalue()

    expected = f'More than 999 files matched for "Line 5" in {tmp_path}. Please narrow your search.\n'
    assert result.split('\n') == expected.split('\n')


def test_search_dir_cwd(tmp_path, monkeypatch):
    """search_dir without a directory argument searches the working directory."""
    # Using pytest's monkeypatch to change directory without affecting other tests
    monkeypatch.chdir(tmp_path)
    # Create 100 files; only a50.txt gets the search term "bingo" (on line 6).
    for i in range(1, 101):
        temp_file_path = tmp_path / f'a{i}.txt'
        with open(temp_file_path, 'w') as file:
            file.write('Line 1\nLine 2\nLine 3\nLine 4\nLine 5\n')
            if i == 50:
                file.write('bingo')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            search_dir('bingo')
        result = buf.getvalue()

    expected = (
        '[Found 1 matches for "bingo" in ./]\n'
        './a50.txt (Line 6): bingo\n'
        '[End of matches for "bingo" in ./]\n'
    )
    assert result.split('\n') == expected.split('\n')


def test_search_file(tmp_path):
    """search_file lists the matching line of a single file."""
    temp_file_path = tmp_path / 'a.txt'
    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            search_file('Line 5', str(temp_file_path))
        result = buf.getvalue()

    expected = f'[Found 1 matches for "Line 5" in {temp_file_path}]\n'
    # First "Line 5" is the location label, second is the matched line's text.
    expected += 'Line 5: Line 5\n'
    expected += f'[End of matches for "Line 5" in {temp_file_path}]\n'
    assert result.split('\n') == expected.split('\n')


def test_search_file_not_exist_term(tmp_path):
    """search_file reports no matches when the term is absent from the file."""
    temp_file_path = tmp_path / 'a.txt'
    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            search_file('Line 6', str(temp_file_path))
        result = buf.getvalue()

    expected = f'[No matches found for "Line 6" in {temp_file_path}]\n'
    assert result.split('\n') == expected.split('\n')


def test_search_file_not_exist_file():
    """search_file on a path that does not exist prints a not-found error."""
    expected_message = 'ERROR: File /unexist/path/a.txt not found.'

    def search_missing_file():
        search_file('Line 6', '/unexist/path/a.txt')

    _capture_file_operation_error(search_missing_file, expected_message)


def test_find_file(tmp_path):
    """find_file lists the matching file inside an explicitly given directory."""
    temp_file_path = tmp_path / 'a.txt'
    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            find_file('a.txt', str(tmp_path))
        result = buf.getvalue()

    expected = f'[Found 1 matches for "a.txt" in {tmp_path}]\n'
    expected += f'{tmp_path}/a.txt\n'
    expected += f'[End of matches for "a.txt" in {tmp_path}]\n'
    assert result.split('\n') == expected.split('\n')


def test_find_file_cwd(tmp_path, monkeypatch):
    """find_file without a directory argument searches the working directory."""
    # monkeypatch restores the original working directory after the test.
    monkeypatch.chdir(tmp_path)
    temp_file_path = tmp_path / 'a.txt'
    temp_file_path.write_text('Line 1\nLine 2\nLine 3\nLine 4\nLine 5')

    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            find_file('a.txt')
        result = buf.getvalue()

    # The header format mirrors the explicit-directory test, with the default
    # directory rendered as "./" as in the no-match test for the cwd case.
    assert '[Found 1 matches for "a.txt" in ./]' in result


def test_find_file_not_exist_file():
    """find_file reports no matches for a name absent from the working directory.

    NOTE(review): this runs in whatever directory pytest was started from and
    assumes no file matching ``nonexist.txt`` exists there.
    """
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            find_file('nonexist.txt')
        result = buf.getvalue()

    expected = '[No matches found for "nonexist.txt" in ./]\n'
    assert result.split('\n') == expected.split('\n')


def test_find_file_not_exist_file_specific_path(tmp_path):
    """find_file reports no matches for a name absent from the given directory."""
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            find_file('nonexist.txt', str(tmp_path))
        result = buf.getvalue()

    expected = f'[No matches found for "nonexist.txt" in {tmp_path}]\n'
    assert result.split('\n') == expected.split('\n')


def test_parse_docx(tmp_path):
    """parse_docx prints each paragraph of a DOCX file under its own page header."""
    # Create a DOCX file with some content
    test_docx_path = tmp_path / 'test.docx'
    doc = docx.Document()
    doc.add_paragraph('Hello, this is a test document.')
    doc.add_paragraph('This is the second paragraph.')
    doc.save(str(test_docx_path))

    # redirect_stdout restores sys.stdout even if parse_docx raises, unlike a
    # manual swap of sys.stdout.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            parse_docx(str(test_docx_path))
        output = buf.getvalue()

    # Check if the output is correct
    expected_output = (
        f'[Reading DOCX file from {test_docx_path}]\n'
        '@@ Page 1 @@\nHello, this is a test document.\n\n'
        '@@ Page 2 @@\nThis is the second paragraph.\n\n\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'


def test_parse_latex(tmp_path):
    """parse_latex prints the text content of a LaTeX document."""
    # Create a LaTeX file with some content
    test_latex_path = tmp_path / 'test.tex'
    with open(test_latex_path, 'w') as f:
        f.write(r"""
        \documentclass{article}
        \begin{document}
        Hello, this is a test LaTeX document.
        \end{document}
        """)

    # redirect_stdout restores sys.stdout even if parse_latex raises, unlike a
    # manual swap of sys.stdout.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            parse_latex(str(test_latex_path))
        output = buf.getvalue()

    # Check if the output is correct
    expected_output = (
        f'[Reading LaTex file from {test_latex_path}]\n'
        'Hello, this is a test LaTeX document.\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'


def test_parse_pdf(tmp_path):
    """parse_pdf prints the text of a one-page PDF under a page header."""
    # Create a PDF file with some content
    test_pdf_path = tmp_path / 'test.pdf'
    from reportlab.lib.pagesizes import letter
    from reportlab.pdfgen import canvas

    c = canvas.Canvas(str(test_pdf_path), pagesize=letter)
    c.drawString(100, 750, 'Hello, this is a test PDF document.')
    c.save()

    # redirect_stdout restores sys.stdout even if parse_pdf raises, unlike a
    # manual swap of sys.stdout.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            parse_pdf(str(test_pdf_path))
        output = buf.getvalue()

    # Check if the output is correct
    expected_output = (
        f'[Reading PDF file from {test_pdf_path}]\n'
        '@@ Page 1 @@\n'
        'Hello, this is a test PDF document.\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'


def test_parse_pptx(tmp_path):
    """parse_pptx prints each slide's title text under its own slide header."""
    test_pptx_path = tmp_path / 'test.pptx'
    from pptx import Presentation

    pres = Presentation()

    slide1 = pres.slides.add_slide(pres.slide_layouts[0])
    title1 = slide1.shapes.title
    title1.text = 'Hello, this is the first test PPTX slide.'

    slide2 = pres.slides.add_slide(pres.slide_layouts[0])
    title2 = slide2.shapes.title
    title2.text = 'Hello, this is the second test PPTX slide.'

    pres.save(str(test_pptx_path))

    # redirect_stdout restores sys.stdout even if parse_pptx raises, unlike a
    # manual swap of sys.stdout.
    with io.StringIO() as buf:
        with contextlib.redirect_stdout(buf):
            parse_pptx(str(test_pptx_path))
        output = buf.getvalue()

    expected_output = (
        f'[Reading PowerPoint file from {test_pptx_path}]\n'
        '@@ Slide 1 @@\n'
        'Hello, this is the first test PPTX slide.\n\n'
        '@@ Slide 2 @@\n'
        'Hello, this is the second test PPTX slide.\n\n'
    )
    assert output == expected_output, f'Expected output does not match. Got: {output}'