Switch the OCR service models to camelCase field names.

main.py: run_ocr reads request.pdfUrl and request.scriptType instead of
the snake_case attributes.
models.py: OcrRequest and OcrBlock drop their Field(alias=...) declarations
in favour of camelCase field names. OcrBlock's nested `class Config` is
replaced by `model_config = ConfigDict(populate_by_name=True)`, and
OcrRequest gains the same model_config.

NOTE(review): with no aliases left on either model, populate_by_name=True
appears to have no effect; confirm whether it can be dropped.
NOTE(review): any caller outside this patch that still uses pdf_url,
script_type or page_number (as attribute or keyword argument) would need
the same rename; verify before merging.

diff --git a/ocr-service/main.py b/ocr-service/main.py
index 73dbef28..558c91d3 100644
--- a/ocr-service/main.py
+++ b/ocr-service/main.py
@@ -56,9 +56,9 @@ async def run_ocr(request: OcrRequest):
     if not _models_ready:
         raise HTTPException(status_code=503, detail="Models not loaded yet")
 
-    images = await _download_and_convert_pdf(request.pdf_url)
+    images = await _download_and_convert_pdf(request.pdfUrl)
 
-    script_type = request.script_type.upper()
+    script_type = request.scriptType.upper()
 
     if script_type == "HANDWRITING_KURRENT":
         if not kraken_engine.is_available():
diff --git a/ocr-service/models.py b/ocr-service/models.py
index 0d2c1590..f58bd5c3 100644
--- a/ocr-service/models.py
+++ b/ocr-service/models.py
@@ -1,20 +1,21 @@
-from pydantic import BaseModel, Field
+from pydantic import BaseModel, ConfigDict
 
 
 class OcrRequest(BaseModel):
-    pdf_url: str = Field(..., alias="pdfUrl")
-    script_type: str = Field("UNKNOWN", alias="scriptType")
+    model_config = ConfigDict(populate_by_name=True)
+
+    pdfUrl: str
+    scriptType: str = "UNKNOWN"
     language: str = "de"
 
 
 class OcrBlock(BaseModel):
-    page_number: int = Field(..., alias="pageNumber")
+    model_config = ConfigDict(populate_by_name=True)
+
+    pageNumber: int
     x: float
     y: float
     width: float
     height: float
     polygon: list[list[float]] | None = None
     text: str
-
-    class Config:
-        populate_by_name = True