restructure project

This commit is contained in:
Yaojia Wang
2026-01-27 23:58:17 +01:00
parent 58bf75db68
commit d6550375b0
230 changed files with 5513 additions and 1756 deletions

View File

@@ -12,7 +12,7 @@ Usage:
import pytest
from pathlib import Path
from unittest.mock import patch, MagicMock
-from src.pdf.extractor import (
+from shared.pdf.extractor import (
Token,
PDFDocument,
extract_text_tokens,
@@ -509,7 +509,7 @@ class TestPDFDocumentIsTextPDF:
mock_doc = MagicMock()
with patch("fitz.open", return_value=mock_doc):
-with patch("src.pdf.extractor._is_text_pdf_standalone", return_value=True) as mock_check:
+with patch("shared.pdf.extractor._is_text_pdf_standalone", return_value=True) as mock_check:
with PDFDocument("test.pdf") as pdf:
result = pdf.is_text_pdf(min_chars=50)