fix: change default OCR language from English to Swedish
The project targets Swedish invoice extraction. PaddleOCR's `sv` model provides better recognition of Swedish-specific characters (å, ä, ö).
This commit is contained in:
@@ -58,7 +58,7 @@ class OCREngine:
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
- lang: str = "en",
|
||||
+ lang: str = "sv",
|
||||
det_model_dir: str | None = None,
|
||||
rec_model_dir: str | None = None,
|
||||
use_doc_orientation_classify: bool = True,
|
||||
@@ -387,7 +387,7 @@ class OCREngine:
|
||||
|
||||
def extract_ocr_tokens(
|
||||
image_path: str | Path,
|
||||
- lang: str = "en",
|
||||
+ lang: str = "sv",
|
||||
page_no: int = 0
|
||||
) -> list[OCRToken]:
|
||||
"""
|
||||
|
||||
Reference in New Issue
Block a user