from upsonic.ocr import OCR
from upsonic.ocr.layer_1.engines import (
PaddleOCREngine, PPStructureV3Engine,
PPChatOCRv4Engine, PaddleOCRVLEngine
)
# The same engine classes can also be imported directly from the package, e.g.:
#   from upsonic.ocr import PaddleOCREngine, PPStructureV3Engine
# --- General-purpose OCR (PP-OCRv5) ---
# Configure the engine, hand it to the OCR front end as its layer-1 engine,
# then pull the text out of a PDF.
engine = PaddleOCREngine(lang="en", ocr_version="PP-OCRv5")
ocr = OCR(layer_1_ocr_engine=engine)
text = ocr.get_text("document.pdf")
# --- Advanced document structure recognition (PP-StructureV3) ---
# Table and formula recognition are both switched on explicitly here.
engine_structure = PPStructureV3Engine(
    use_table_recognition=True,
    use_formula_recognition=True,
)
ocr_structure = OCR(layer_1_ocr_engine=engine_structure)
# process_file runs the configured engine over the given document.
result = ocr_structure.process_file("research_paper.pdf")
# --- Chat-based document understanding (PP-ChatOCRv4) ---
# Table and seal recognition are both switched on explicitly here.
engine_chat = PPChatOCRv4Engine(
    use_table_recognition=True,
    use_seal_recognition=True,
)
ocr_chat = OCR(layer_1_ocr_engine=engine_chat)
# --- Vision-language document understanding (PaddleOCR-VL) ---
# Layout detection, chart recognition and block-content formatting are
# all switched on explicitly here.
engine_vl = PaddleOCRVLEngine(
    use_layout_detection=True,
    use_chart_recognition=True,
    format_block_content=True,
)
ocr_vl = OCR(layer_1_ocr_engine=engine_vl)