fix: change default OCR language from English to Swedish

The project targets Swedish invoice extraction. The PaddleOCR `sv` model provides
better recognition of Swedish-specific characters (å, ä, ö).
This commit is contained in:
Yaojia Wang
2026-02-12 23:19:51 +01:00
parent 58d36c8927
commit d8f2acb762
6 changed files with 8 additions and 8 deletions

View File

@@ -58,7 +58,7 @@ class OCREngine:
def __init__(
self,
lang: str = "en",
lang: str = "sv",
det_model_dir: str | None = None,
rec_model_dir: str | None = None,
use_doc_orientation_classify: bool = True,
@@ -387,7 +387,7 @@ class OCREngine:
def extract_ocr_tokens(
image_path: str | Path,
lang: str = "en",
lang: str = "sv",
page_no: int = 0
) -> list[OCRToken]:
"""