server/src/app/api/v1/endpoints/ocr.py

from __future__ import annotations

from typing import Annotated

from fastapi import APIRouter, Depends, File, Form, HTTPException, UploadFile, status
from sqlalchemy.orm import Session
from starlette.concurrency import run_in_threadpool

from app.api.deps import CurrentUserContext, get_current_user, get_db
from app.schemas.common import ErrorResponse
from app.schemas.ocr import OcrRecognizeBatchRead
from app.services.ocr import OcrService
from app.services.receipt_folder import ReceiptFolderService

router = APIRouter(prefix="/ocr")


@router.post(
    "/recognize",
    response_model=OcrRecognizeBatchRead,
    summary="识别票据或图片 OCR",
    description="使用 PaddleOCR mobile 模型对上传的图片或 PDF 执行 OCR，并返回结构化文本摘要。",
    responses={
        status.HTTP_400_BAD_REQUEST: {
            "model": ErrorResponse,
            "description": "未上传文件或文件参数非法。",
        },
        status.HTTP_401_UNAUTHORIZED: {
            "model": ErrorResponse,
            "description": "未提供当前登录用户。",
        },
        status.HTTP_503_SERVICE_UNAVAILABLE: {
            "model": ErrorResponse,
            "description": "OCR 运行时不可用或执行失败。",
        },
    },
)
async def recognize_ocr_documents(
    files: Annotated[list[UploadFile], File(description="待识别的票据图片或 PDF。")],
    current_user: Annotated[CurrentUserContext, Depends(get_current_user)],
    db: Annotated[Session, Depends(get_db)],
    receipt_ids: Annotated[list[str] | None, Form(description="可选，来源于票据夹的持久化票据 ID。")] = None,
) -> OcrRecognizeBatchRead:
    try:
        payload = []
        for upload in files:
            payload.append(
                (
                    str(upload.filename or "upload.bin"),
                    await upload.read(),
                    upload.content_type,
                )
            )
        result = await run_in_threadpool(lambda: OcrService(db).recognize_files(payload))
        return ReceiptFolderService().persist_ocr_batch(
            files=payload,
            result=result,
            current_user=current_user,
            receipt_ids=receipt_ids or [],
        )
    except ValueError as exc:
        raise HTTPException(status_code=status.HTTP_400_BAD_REQUEST, detail=str(exc)) from exc
    except RuntimeError as exc:
        raise HTTPException(
            status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
            detail=str(exc),
        ) from exc
-												feat(server): add OCR invoice processing functionality

New endpoints:
- server/src/app/api/v1/endpoints/ocr.py: OCR API endpoints for invoice scanning

New schemas:
- server/src/app/schemas/ocr.py: OCR request/response data schemas

New services:
- server/src/app/services/ocr.py: OCR processing business logic
- server/src/app/services/expense_claims.py: expense claims management service

Scripts:
- server/scripts/bootstrap_paddleocr_mobile.sh: PaddleOCR mobile setup script
- server/scripts/paddle_ocr_worker.py: PaddleOCR worker process

											
										
										
											2026-05-12 03:04:10 +00:00
+								from __future__ import annotations
 								from typing import Annotated
-												feat: 新增票据夹模块并优化 OCR 与员工画像服务

后端新增票据夹端点、数据模型和服务模块，优化 OCR 端点
Schema 和附件操作逻辑，完善员工行为画像服务和辅助函数，
前端新增票据夹视图和服务层，优化文档中心样式和侧边栏导
航，完善员工画像详情弹窗和权限控制，补充单元测试。

											
										
										
											2026-05-29 14:51:18 +08:00
+								from fastapi import APIRouter, Depends, File, Form, HTTPException, UploadFile, status
-												feat(server): 新增文档智能识别服务，扩展OCR接口支持 Azure Document Intelligence

											
										
										
											2026-05-14 09:32:15 +00:00
+								from sqlalchemy.orm import Session
-												feat: 报销审批流重构与管家计划全链路贯通

- 重构报销状态注册表、审批流路由与平台风险标记
- 完善管家意图规划器与模型计划构建器全链路
- 新增 OCR Worker 脚本、数据库会话管理与通知状态
- 优化文档中心、日志视图、预算中心与员工管理交互
- 增强工作台摘要、图标资源与全局主题样式
- 补充审批路由、状态注册、OCR 服务与管家规划器测试覆盖

											
										
										
											2026-06-06 17:19:07 +08:00
+								from starlette.concurrency import run_in_threadpool
-												feat(server): add OCR invoice processing functionality

New endpoints:
- server/src/app/api/v1/endpoints/ocr.py: OCR API endpoints for invoice scanning

New schemas:
- server/src/app/schemas/ocr.py: OCR request/response data schemas

New services:
- server/src/app/services/ocr.py: OCR processing business logic
- server/src/app/services/expense_claims.py: expense claims management service

Scripts:
- server/scripts/bootstrap_paddleocr_mobile.sh: PaddleOCR mobile setup script
- server/scripts/paddle_ocr_worker.py: PaddleOCR worker process

											
										
										
											2026-05-12 03:04:10 +00:00
-												feat(server): 新增文档智能识别服务，扩展OCR接口支持 Azure Document Intelligence

											
										
										
											2026-05-14 09:32:15 +00:00
+								from app.api.deps import CurrentUserContext, get_current_user, get_db
-												feat(server): add OCR invoice processing functionality

New endpoints:
- server/src/app/api/v1/endpoints/ocr.py: OCR API endpoints for invoice scanning

New schemas:
- server/src/app/schemas/ocr.py: OCR request/response data schemas

New services:
- server/src/app/services/ocr.py: OCR processing business logic
- server/src/app/services/expense_claims.py: expense claims management service

Scripts:
- server/scripts/bootstrap_paddleocr_mobile.sh: PaddleOCR mobile setup script
- server/scripts/paddle_ocr_worker.py: PaddleOCR worker process

											
										
										
											2026-05-12 03:04:10 +00:00
+								from app.schemas.common import ErrorResponse
 								from app.schemas.ocr import OcrRecognizeBatchRead
 								from app.services.ocr import OcrService
-												feat: 新增票据夹模块并优化 OCR 与员工画像服务

后端新增票据夹端点、数据模型和服务模块，优化 OCR 端点
Schema 和附件操作逻辑，完善员工行为画像服务和辅助函数，
前端新增票据夹视图和服务层，优化文档中心样式和侧边栏导
航，完善员工画像详情弹窗和权限控制，补充单元测试。

											
										
										
											2026-05-29 14:51:18 +08:00
+								from app.services.receipt_folder import ReceiptFolderService
-												feat(server): add OCR invoice processing functionality

New endpoints:
- server/src/app/api/v1/endpoints/ocr.py: OCR API endpoints for invoice scanning

New schemas:
- server/src/app/schemas/ocr.py: OCR request/response data schemas

New services:
- server/src/app/services/ocr.py: OCR processing business logic
- server/src/app/services/expense_claims.py: expense claims management service

Scripts:
- server/scripts/bootstrap_paddleocr_mobile.sh: PaddleOCR mobile setup script
- server/scripts/paddle_ocr_worker.py: PaddleOCR worker process

											
										
										
											2026-05-12 03:04:10 +00:00
 								router = APIRouter(prefix="/ocr")
 								@router.post(
 								    "/recognize",
 								    response_model=OcrRecognizeBatchRead,
 								    summary="识别票据或图片 OCR",
 								    description="使用 PaddleOCR mobile 模型对上传的图片或 PDF 执行 OCR，并返回结构化文本摘要。",
 								    responses={
 								        status.HTTP_400_BAD_REQUEST: {
 								            "model": ErrorResponse,
 								            "description": "未上传文件或文件参数非法。",
 								        },
 								        status.HTTP_401_UNAUTHORIZED: {
 								            "model": ErrorResponse,
 								            "description": "未提供当前登录用户。",
 								        },
 								        status.HTTP_503_SERVICE_UNAVAILABLE: {
 								            "model": ErrorResponse,
 								            "description": "OCR 运行时不可用或执行失败。",
 								        },
 								    },
 								)
 								async def recognize_ocr_documents(
 								    files: Annotated[list[UploadFile], File(description="待识别的票据图片或 PDF。")],
-												feat: 新增票据夹模块并优化 OCR 与员工画像服务

后端新增票据夹端点、数据模型和服务模块，优化 OCR 端点
Schema 和附件操作逻辑，完善员工行为画像服务和辅助函数，
前端新增票据夹视图和服务层，优化文档中心样式和侧边栏导
航，完善员工画像详情弹窗和权限控制，补充单元测试。

											
										
										
											2026-05-29 14:51:18 +08:00
+								    current_user: Annotated[CurrentUserContext, Depends(get_current_user)],
-												feat(server): 新增文档智能识别服务，扩展OCR接口支持 Azure Document Intelligence

											
										
										
											2026-05-14 09:32:15 +00:00
+								    db: Annotated[Session, Depends(get_db)],
-												feat: 新增票据夹模块并优化 OCR 与员工画像服务

后端新增票据夹端点、数据模型和服务模块，优化 OCR 端点
Schema 和附件操作逻辑，完善员工行为画像服务和辅助函数，
前端新增票据夹视图和服务层，优化文档中心样式和侧边栏导
航，完善员工画像详情弹窗和权限控制，补充单元测试。

											
										
										
											2026-05-29 14:51:18 +08:00
+								    receipt_ids: Annotated[list[str] | None, Form(description="可选，来源于票据夹的持久化票据 ID。")] = None,
-												feat(server): add OCR invoice processing functionality

New endpoints:
- server/src/app/api/v1/endpoints/ocr.py: OCR API endpoints for invoice scanning

New schemas:
- server/src/app/schemas/ocr.py: OCR request/response data schemas

New services:
- server/src/app/services/ocr.py: OCR processing business logic
- server/src/app/services/expense_claims.py: expense claims management service

Scripts:
- server/scripts/bootstrap_paddleocr_mobile.sh: PaddleOCR mobile setup script
- server/scripts/paddle_ocr_worker.py: PaddleOCR worker process

											
										
										
											2026-05-12 03:04:10 +00:00
+								) -> OcrRecognizeBatchRead:
 								    try:
 								        payload = []
 								        for upload in files:
 								            payload.append(
 								                (
 								                    str(upload.filename or "upload.bin"),
 								                    await upload.read(),
 								                    upload.content_type,
 								                )
 								            )
-												feat: 报销审批流重构与管家计划全链路贯通

- 重构报销状态注册表、审批流路由与平台风险标记
- 完善管家意图规划器与模型计划构建器全链路
- 新增 OCR Worker 脚本、数据库会话管理与通知状态
- 优化文档中心、日志视图、预算中心与员工管理交互
- 增强工作台摘要、图标资源与全局主题样式
- 补充审批路由、状态注册、OCR 服务与管家规划器测试覆盖

											
										
										
											2026-06-06 17:19:07 +08:00
+								        result = await run_in_threadpool(lambda: OcrService(db).recognize_files(payload))
-												feat: 新增票据夹模块并优化 OCR 与员工画像服务

后端新增票据夹端点、数据模型和服务模块，优化 OCR 端点
Schema 和附件操作逻辑，完善员工行为画像服务和辅助函数，
前端新增票据夹视图和服务层，优化文档中心样式和侧边栏导
航，完善员工画像详情弹窗和权限控制，补充单元测试。

											
										
										
											2026-05-29 14:51:18 +08:00
+								        return ReceiptFolderService().persist_ocr_batch(
 								            files=payload,
 								            result=result,
 								            current_user=current_user,
 								            receipt_ids=receipt_ids or [],
 								        )
-												feat(server): add OCR invoice processing functionality

New endpoints:
- server/src/app/api/v1/endpoints/ocr.py: OCR API endpoints for invoice scanning

New schemas:
- server/src/app/schemas/ocr.py: OCR request/response data schemas

New services:
- server/src/app/services/ocr.py: OCR processing business logic
- server/src/app/services/expense_claims.py: expense claims management service

Scripts:
- server/scripts/bootstrap_paddleocr_mobile.sh: PaddleOCR mobile setup script
- server/scripts/paddle_ocr_worker.py: PaddleOCR worker process

											
										
										
											2026-05-12 03:04:10 +00:00
+								    except ValueError as exc:
 								        raise HTTPException(status_code=status.HTTP_400_BAD_REQUEST, detail=str(exc)) from exc
 								    except RuntimeError as exc:
 								        raise HTTPException(
 								            status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
 								            detail=str(exc),
 								        ) from exc