gabykim's picture
docstring before function definition
d9d9220
raw
history blame
5.22 kB
from know_lang_bot.code_parser.parser import CodeChunk, CodeParser, ChunkType
from pathlib import Path
from tests.test_constants import (
SIMPLE_FILE_EXPECTATIONS,
NESTED_CLASS_EXPECTATIONS,
COMPLEX_FILE_EXPECTATIONS,
INVALID_SYNTAX,
TEST_FILES,
)
import pytest
import tempfile
import git
@pytest.fixture
def temp_repo():
"""Create a temporary git repository with sample Python files"""
with tempfile.TemporaryDirectory() as temp_dir:
# Initialize git repo
repo = git.Repo.init(temp_dir)
# Create sample Python files
for filename, content in TEST_FILES.items():
file_path = Path(temp_dir) / filename
file_path.write_text(content)
repo.index.add([str(file_path)])
repo.index.commit("Initial commit")
yield temp_dir
def find_chunk_by_criteria(chunks: list[CodeChunk], **criteria) -> CodeChunk:
"""Helper function to find a chunk matching given criteria"""
for chunk in chunks:
if all(getattr(chunk, k) == v for k, v in criteria.items()):
return chunk
return None
def test_init_parser(temp_repo):
"""Test parser initialization"""
parser = CodeParser(temp_repo)
assert parser.repo_path == Path(temp_repo)
assert parser.language is not None
assert parser.parser is not None
def test_parse_simple_file(temp_repo):
"""Test parsing a simple Python file with function and class"""
parser = CodeParser(temp_repo)
chunks = parser.parse_file(Path(temp_repo) / "simple.py")
# Test function
function_chunk = find_chunk_by_criteria(chunks, type=ChunkType.FUNCTION, name="hello_world")
assert function_chunk is not None
expected = SIMPLE_FILE_EXPECTATIONS['hello_world']
assert expected.content_snippet in function_chunk.content
assert function_chunk.docstring is not None
assert function_chunk.docstring in expected.docstring
# Test class
class_chunk = find_chunk_by_criteria(chunks, type=ChunkType.CLASS, name="SimpleClass")
assert class_chunk is not None
expected = SIMPLE_FILE_EXPECTATIONS['SimpleClass']
assert expected.content_snippet in class_chunk.content
assert class_chunk.docstring is not None
assert class_chunk.docstring in expected.docstring
def test_parse_nested_classes(temp_repo):
"""Test parsing nested class definitions"""
parser = CodeParser(temp_repo)
chunks = parser.parse_file(Path(temp_repo) / "nested.py")
# Test outer class
outer_class = find_chunk_by_criteria(chunks, type=ChunkType.CLASS, name="OuterClass")
assert outer_class is not None
expected = NESTED_CLASS_EXPECTATIONS['OuterClass']
assert expected.content_snippet in outer_class.content
assert outer_class.docstring is not None
assert outer_class.docstring in expected.docstring
# Verify inner class: Not implemented yet
pass
def test_parse_complex_file(temp_repo):
"""Test parsing a complex Python file"""
parser = CodeParser(temp_repo)
chunks = parser.parse_file(Path(temp_repo) / "complex.py")
# Test function with type hints
complex_func = find_chunk_by_criteria(
chunks,
type=ChunkType.FUNCTION,
name="complex_function"
)
assert complex_func is not None
expected = COMPLEX_FILE_EXPECTATIONS['complex_function']
assert expected.content_snippet in complex_func.content
assert complex_func.docstring is not None
assert complex_func.docstring in expected.docstring
# Test complex class
complex_class = find_chunk_by_criteria(
chunks,
type=ChunkType.CLASS,
name="ComplexClass"
)
assert complex_class is not None
expected = COMPLEX_FILE_EXPECTATIONS['ComplexClass']
assert expected.content_snippet in complex_class.content
assert complex_class.docstring is not None
assert complex_class.docstring in expected.docstring
def test_parse_repository(temp_repo):
"""Test parsing entire repository"""
parser = CodeParser(temp_repo)
chunks = parser.parse_repository()
file_paths = {chunk.file_path for chunk in chunks}
assert len(file_paths) == 3
# Verify we can find chunks from each test file
for filename in TEST_FILES.keys():
file_chunks = [c for c in chunks if Path(c.file_path).name == filename]
assert len(file_chunks) > 0
def test_error_handling(temp_repo):
"""Test error handling for invalid files"""
parser = CodeParser(temp_repo)
# Test invalid syntax
invalid_file = Path(temp_repo) / "invalid.py"
invalid_file.write_text(INVALID_SYNTAX)
chunks = parser.parse_file(invalid_file)
assert chunks == []
# Test non-existent file
nonexistent = Path(temp_repo) / "nonexistent.py"
chunks = parser.parse_file(nonexistent)
assert chunks == []
def test_non_python_files(temp_repo):
"""Test handling of non-Python files"""
parser = CodeParser(temp_repo)
# Create a non-Python file
non_python = Path(temp_repo) / "readme.md"
non_python.write_text("# README")
# Should skip non-Python files
chunks = parser.parse_file(non_python)
assert chunks == []