File size: 540 Bytes
5e9cd1d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
import sys
from pathlib import Path
from pprint import pprint

# Directory three levels above this file (presumably the project root).
root_path = Path(__file__).parent.parent.parent
# Add that directory to the import search path so modules living under it
# can be imported by the tests below.
sys.path.append(str(root_path))

# Sample inputs for the tests, keyed by file name; values are string paths.
test_files = {
    "ocr_test.pdf": str(root_path.joinpath("tests", "samples", "ocr_test.pdf")),
}

def test_rapidocrpdfloader():
    """Load the sample OCR PDF with RapidOCRPDFLoader and sanity-check the output.

    The test passes when ``load()`` returns a non-empty list whose first
    element exposes a string ``page_content`` attribute.
    """
    sample_pdf = test_files["ocr_test.pdf"]
    # Imported inside the test so it is resolved only when the test runs,
    # after the module-level sys.path modification.
    from document_loaders import RapidOCRPDFLoader

    documents = RapidOCRPDFLoader(sample_pdf).load()
    pprint(documents)  # dump the loaded documents to aid debugging

    # Checked one at a time, in the same order as a short-circuiting `and`.
    assert isinstance(documents, list)
    assert len(documents) > 0
    assert isinstance(documents[0].page_content, str)