Spaces:
Running
Running
File size: 497 Bytes
472739a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 |
import fitz # PyMuPDF
def extract_text_from_pdf(pdf_path: str) -> str:
    """Extract the text of every page of a PDF using PyMuPDF.

    The document is opened with ``fitz.open`` and the result of
    ``page.get_text()`` (called with its default arguments) is
    concatenated across pages in document order.

    This function is best-effort: any exception raised while opening or
    reading the file is reported on stdout and an empty string is
    returned instead of propagating the error.

    Args:
        pdf_path: Path to the PDF file.

    Returns:
        The concatenated text of all pages, or ``""`` if the file could
        not be opened or read.
    """
    try:
        # The context manager closes the document even if a page fails
        # to extract, so the underlying file handle is never leaked.
        with fitz.open(pdf_path) as doc:
            # join() avoids repeated string reallocation on large PDFs.
            return "".join(page.get_text() for page in doc)
    except Exception as e:
        # Deliberately broad: callers rely on getting "" rather than an
        # exception for unreadable or missing files.
        print(f"Error reading PDF {pdf_path}: {e}")
        return ""
|