Spaces:
Sleeping
Sleeping
| import sys | |
| from pathlib import Path | |
# Directory three levels above this file; appended to sys.path, presumably so
# the `document_loaders` import inside the test below can be resolved.
root_path = Path(__file__).parent.parent.parent
sys.path.append(str(root_path))
| from pprint import pprint | |
# Maps a sample file name to its path (as a string) under
# <root_path>/tests/samples.
test_files = {
    "ocr_test.pdf": str(root_path / "tests" / "samples" / "ocr_test.pdf"),
}
def test_rapidocrpdfloader():
    """Check that RapidOCRPDFLoader loads the sample PDF into documents.

    Builds a loader for the path registered under "ocr_test.pdf" in
    ``test_files``, calls ``load()``, pretty-prints the result, and verifies
    that it is a non-empty list whose first element has a string
    ``page_content``.
    """
    pdf_path = test_files["ocr_test.pdf"]
    # Imported inside the test rather than at module top; presumably so the
    # module-level sys.path change has already taken effect.
    from document_loaders import RapidOCRPDFLoader

    loader = RapidOCRPDFLoader(pdf_path)
    docs = loader.load()
    pprint(docs)

    # One assertion per expectation so a failure names the exact condition.
    assert isinstance(docs, list)
    assert len(docs) > 0
    assert isinstance(docs[0].page_content, str)