# Walk every text block of a PDF with PyMuPDF (fitz), collecting text into `text`.
pdf_file = "example.pdf"
text = ""

# Open the document in a context manager so the underlying file is released
# even if block processing raises.
with fitz.open(pdf_file) as pdf_document:
    for page in pdf_document:
        # Each entry from get_text("blocks") is indexed positionally: the first
        # four items are unpacked as the bounding box, the fifth as the text.
        for block in page.get_text("blocks"):
            x0, y0, x1, y1 = block[0:4]
            text_block = block[4]
            # Filter out tables based on the text block's attributes.
            # NOTE(review): the original snippet is cut off at this point; the
            # filtering condition and the code that presumably appends
            # `text_block` to `text` are not visible and must be restored here.