@comment{arXiv preprint 2510.10138 (cs.AI). The exporter had pasted the
  timestamp "Sat Oct 11 2025 09:40:34 GMT+0000" into both the citation key
  and the year field; the key now follows the lastnameYYYYkeyword scheme,
  year holds the four-digit year, and month keeps the month from that
  timestamp.}
@misc{wang2025hybridocrllmframework,
  author        = {Wang, Zilong and Shen, Xiaoyu},
  title         = {Hybrid {OCR-LLM} Framework for Enterprise-Scale Document Information Extraction Under Copy-heavy Task},
  year          = {2025},
  month         = oct,
  eprint        = {2510.10138},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI},
  url           = {https://arxiv.org/abs/2510.10138},
}

Transform this paper into an audio lecture
Get an engaging lecture and Q&A format to quickly understand the paper in minutes, perfect for learning on the go.