huggingface_hub>=0.20.0
python-docx
scikit-learn
pdfplumber
numpy
fpdf2