"""Field-extraction entry point built on ``HMHRetriever``."""

from .retriever import HMHRetriever
from .tools import pdf_info_rebuild

# Shared retriever, constructed once at import time and reused by every
# predict() call.
hmh_retriever = HMHRetriever()


def predict(pdf_info):
    """Return the retriever's target fields for *pdf_info*.

    ``pdf_info`` is passed through ``pdf_info_rebuild`` with
    ``fix_bbox=False``. That call's result is unpacked into two values; only
    the first is used and the second is discarded. The first value is then
    handed to ``hmh_retriever.get_target_fields`` and whatever that returns
    is returned unchanged.

    NOTE(review): the structure of ``pdf_info`` and of the returned fields is
    defined by ``.tools`` / ``.retriever`` and is not visible from this
    module -- confirm against those modules.
    """
    pdf_text_list, _ = pdf_info_rebuild(pdf_info, fix_bbox=False)
    return hmh_retriever.get_target_fields(pdf_text_list)